Warning: Permanently added '2620:52:3:1:dead:beef:cafe:c112' (ED25519) to the list of known hosts. You can reproduce this build on your computer by running: sudo dnf install copr-rpmbuild /usr/bin/copr-rpmbuild --verbose --drop-resultdir --task-url https://copr.fedorainfracloud.org/backend/get-build-task/9314147-fedora-rawhide-x86_64 --chroot fedora-rawhide-x86_64 Version: 1.3 PID: 2855 Logging PID: 2856 Task: {'allow_user_ssh': False, 'appstream': False, 'background': True, 'build_id': 9314147, 'buildroot_pkgs': [], 'chroot': 'fedora-rawhide-x86_64', 'enable_net': False, 'fedora_review': False, 'git_hash': 'ce7e37371920aa474807c22e7c18fc119485ad01', 'git_repo': 'https://copr-dist-git.fedorainfracloud.org/git/@rocm-packagers-sig/RH/rccl', 'isolation': 'default', 'memory_reqs': 2048, 'package_name': 'rccl', 'package_version': '6.4.2-1', 'project_dirname': 'RH', 'project_name': 'RH', 'project_owner': '@rocm-packagers-sig', 'repo_priority': None, 'repos': [{'baseurl': 'https://download.copr.fedorainfracloud.org/results/@rocm-packagers-sig/RH/fedora-rawhide-x86_64/', 'id': 'copr_base', 'name': 'Copr repository', 'priority': None}], 'sandbox': '@rocm-packagers-sig/RH--https://src.fedoraproject.org/user/mystro256', 'source_json': {}, 'source_type': None, 'ssh_public_keys': None, 'storage': 0, 'submitter': 'https://src.fedoraproject.org/user/mystro256', 'tags': [], 'task_id': '9314147-fedora-rawhide-x86_64', 'timeout': 18000, 'uses_devel_repo': False, 'with_opts': [], 'without_opts': []} Running: git clone https://copr-dist-git.fedorainfracloud.org/git/@rocm-packagers-sig/RH/rccl /var/lib/copr-rpmbuild/workspace/workdir-q88lb_0o/rccl --depth 500 --no-single-branch --recursive cmd: ['git', 'clone', 'https://copr-dist-git.fedorainfracloud.org/git/@rocm-packagers-sig/RH/rccl', '/var/lib/copr-rpmbuild/workspace/workdir-q88lb_0o/rccl', '--depth', '500', '--no-single-branch', '--recursive'] cwd: . rc: 0 stdout: stderr: Cloning into '/var/lib/copr-rpmbuild/workspace/workdir-q88lb_0o/rccl'... Running: git checkout ce7e37371920aa474807c22e7c18fc119485ad01 -- cmd: ['git', 'checkout', 'ce7e37371920aa474807c22e7c18fc119485ad01', '--'] cwd: /var/lib/copr-rpmbuild/workspace/workdir-q88lb_0o/rccl rc: 0 stdout: stderr: Note: switching to 'ce7e37371920aa474807c22e7c18fc119485ad01'. You are in 'detached HEAD' state. You can look around, make experimental changes and commit them, and you can discard any commits you make in this state without impacting any branches by switching back to a branch. If you want to create a new branch to retain commits you create, you may do so (now or later) by using -c with the switch command. Example: git switch -c Or undo this operation with: git switch - Turn off this advice by setting config variable advice.detachedHead to false HEAD is now at ce7e373 automatic import of rccl Running: dist-git-client sources cmd: ['dist-git-client', 'sources'] cwd: /var/lib/copr-rpmbuild/workspace/workdir-q88lb_0o/rccl rc: 0 stdout: stderr: INFO: Reading stdout from command: git rev-parse --abbrev-ref HEAD INFO: Reading stdout from command: git rev-parse HEAD INFO: Reading sources specification file: sources INFO: Downloading RCCL-6.4.2.tar.gz INFO: Reading stdout from command: curl --help all tail: /var/lib/copr-rpmbuild/main.log: file truncated INFO: Calling: curl -H Pragma: -o RCCL-6.4.2.tar.gz --location --connect-timeout 60 --retry 3 --retry-delay 10 --remote-time --show-error --fail --retry-all-errors https://copr-dist-git.fedorainfracloud.org/repo/pkgs/@rocm-packagers-sig/RH/rccl/RCCL-6.4.2.tar.gz/md5/5323c56546d4e3634f04898820e8816c/RCCL-6.4.2.tar.gz % Total % Received % Xferd Average Speed Time Time Time Current Dload Upload Total Spent Left Speed 100 1851k 100 1851k 0 0 19.4M 0 --:--:-- --:--:-- --:--:-- 19.6M INFO: Reading stdout from command: md5sum RCCL-6.4.2.tar.gz Running (timeout=18000): unbuffer mock --spec /var/lib/copr-rpmbuild/workspace/workdir-q88lb_0o/rccl/rccl.spec --sources /var/lib/copr-rpmbuild/workspace/workdir-q88lb_0o/rccl --resultdir /var/lib/copr-rpmbuild/results --uniqueext 1753289447.166372 -r /var/lib/copr-rpmbuild/results/configs/child.cfg INFO: mock.py version 6.3 starting (python version = 3.13.3, NVR = mock-6.3-1.fc42), args: /usr/libexec/mock/mock --spec /var/lib/copr-rpmbuild/workspace/workdir-q88lb_0o/rccl/rccl.spec --sources /var/lib/copr-rpmbuild/workspace/workdir-q88lb_0o/rccl --resultdir /var/lib/copr-rpmbuild/results --uniqueext 1753289447.166372 -r /var/lib/copr-rpmbuild/results/configs/child.cfg Start(bootstrap): init plugins INFO: tmpfs initialized INFO: selinux enabled INFO: chroot_scan: initialized INFO: compress_logs: initialized Finish(bootstrap): init plugins Start: init plugins INFO: tmpfs initialized INFO: selinux enabled INFO: chroot_scan: initialized INFO: compress_logs: initialized Finish: init plugins INFO: Signal handler active Start: run INFO: Start(/var/lib/copr-rpmbuild/workspace/workdir-q88lb_0o/rccl/rccl.spec) Config(fedora-rawhide-x86_64) Start: clean chroot Finish: clean chroot Mock Version: 6.3 INFO: Mock Version: 6.3 Start(bootstrap): chroot init INFO: mounting tmpfs at /var/lib/mock/fedora-rawhide-x86_64-bootstrap-1753289447.166372/root. INFO: calling preinit hooks INFO: enabled root cache INFO: enabled package manager cache Start(bootstrap): cleaning package manager metadata Finish(bootstrap): cleaning package manager metadata INFO: Guessed host environment type: unknown INFO: Using container image: registry.fedoraproject.org/fedora:rawhide INFO: Pulling image: registry.fedoraproject.org/fedora:rawhide INFO: Tagging container image as mock-bootstrap-5629703d-f4ce-483f-b31d-449e22738039 INFO: Checking that 772e8ca99d4ee24821ae410b5935c40d0807fa0836da3933ad5db6fe20de6b82 image matches host's architecture INFO: Copy content of container 772e8ca99d4ee24821ae410b5935c40d0807fa0836da3933ad5db6fe20de6b82 to /var/lib/mock/fedora-rawhide-x86_64-bootstrap-1753289447.166372/root INFO: mounting 772e8ca99d4ee24821ae410b5935c40d0807fa0836da3933ad5db6fe20de6b82 with podman image mount INFO: image 772e8ca99d4ee24821ae410b5935c40d0807fa0836da3933ad5db6fe20de6b82 as /var/lib/containers/storage/overlay/1b09b4e95c8bad02eb01ebcb7776ff2a89e911f227d7f83f2cb11d567610ea44/merged INFO: umounting image 772e8ca99d4ee24821ae410b5935c40d0807fa0836da3933ad5db6fe20de6b82 (/var/lib/containers/storage/overlay/1b09b4e95c8bad02eb01ebcb7776ff2a89e911f227d7f83f2cb11d567610ea44/merged) with podman image umount INFO: Removing image mock-bootstrap-5629703d-f4ce-483f-b31d-449e22738039 INFO: Package manager dnf5 detected and used (fallback) INFO: Not updating bootstrap chroot, bootstrap_image_ready=True Start(bootstrap): creating root cache Finish(bootstrap): creating root cache Finish(bootstrap): chroot init Start: chroot init INFO: mounting tmpfs at /var/lib/mock/fedora-rawhide-x86_64-1753289447.166372/root. INFO: calling preinit hooks INFO: enabled root cache INFO: enabled package manager cache Start: cleaning package manager metadata Finish: cleaning package manager metadata INFO: enabled HW Info plugin INFO: Package manager dnf5 detected and used (direct choice) INFO: Buildroot is handled by package management downloaded with a bootstrap image: rpm-5.99.91-1.fc43.x86_64 rpm-sequoia-1.9.0-1.fc43.x86_64 dnf5-5.2.15.0-1.fc43.x86_64 dnf5-plugins-5.2.15.0-1.fc43.x86_64 Start: installing minimal buildroot with dnf5 Updating and loading repositories: Copr repository 100% | 1.3 MiB/s | 201.8 KiB | 00m00s fedora 100% | 19.3 MiB/s | 21.8 MiB | 00m01s Repositories loaded. Package Arch Version Repository Size Installing group/module packages: bash x86_64 5.3.0-1.fc43 fedora 8.4 MiB bzip2 x86_64 1.0.8-20.fc42 fedora 99.3 KiB coreutils x86_64 9.7-4.fc43 fedora 5.4 MiB cpio x86_64 2.15-2.fc41 fedora 1.1 MiB diffutils x86_64 3.12-2.fc43 fedora 1.6 MiB fedora-release-common noarch 43-0.19 fedora 20.4 KiB findutils x86_64 1:4.10.0-5.fc42 fedora 1.9 MiB gawk x86_64 5.3.2-1.fc43 fedora 1.8 MiB glibc-minimal-langpack x86_64 2.41.9000-23.fc43 fedora 0.0 B grep x86_64 3.12-1.fc43 fedora 1.0 MiB gzip x86_64 1.13-3.fc42 fedora 392.9 KiB info x86_64 7.2-4.fc43 fedora 353.9 KiB patch x86_64 2.8-1.fc43 fedora 226.8 KiB redhat-rpm-config noarch 343-7.fc43 fedora 181.7 KiB rpm-build x86_64 5.99.91-1.fc43 fedora 289.6 KiB sed x86_64 4.9-4.fc42 fedora 857.3 KiB shadow-utils x86_64 2:4.18.0-1.fc43 fedora 3.9 MiB tar x86_64 2:1.35-5.fc42 fedora 3.0 MiB unzip x86_64 6.0-66.fc42 fedora 390.3 KiB util-linux x86_64 2.41.1-11.fc43 fedora 3.5 MiB which x86_64 2.23-2.fc43 fedora 83.5 KiB xz x86_64 1:5.8.1-1.fc43 fedora 1.3 MiB Installing dependencies: add-determinism x86_64 0.6.0-1.fc43 fedora 2.5 MiB alternatives x86_64 1.33-1.fc43 fedora 62.2 KiB ansible-srpm-macros noarch 1-17.1.fc42 fedora 35.7 KiB audit-libs x86_64 4.1.0-1.fc43 fedora 378.8 KiB binutils x86_64 2.44.90-2.fc43 fedora 26.4 MiB build-reproducibility-srpm-macros noarch 0.6.0-1.fc43 fedora 735.0 B bzip2-libs x86_64 1.0.8-20.fc42 fedora 84.6 KiB ca-certificates noarch 2024.2.69_v8.0.401-5.fc42 fedora 2.6 MiB coreutils-common x86_64 9.7-4.fc43 fedora 11.3 MiB crypto-policies noarch 20250714-1.gitcd6043a.fc43 fedora 146.9 KiB curl x86_64 8.15.0-1.fc43 fedora 473.6 KiB cyrus-sasl-lib x86_64 2.1.28-30.fc42 fedora 2.3 MiB debugedit x86_64 5.2-1.fc43 fedora 197.8 KiB dwz x86_64 0.16-1.fc43 fedora 287.1 KiB ed x86_64 1.21.1-1.fc43 fedora 142.8 KiB efi-srpm-macros noarch 6-3.fc43 fedora 40.1 KiB elfutils x86_64 0.193-2.fc43 fedora 2.9 MiB elfutils-debuginfod-client x86_64 0.193-2.fc43 fedora 83.9 KiB elfutils-default-yama-scope noarch 0.193-2.fc43 fedora 1.8 KiB elfutils-libelf x86_64 0.193-2.fc43 fedora 1.2 MiB elfutils-libs x86_64 0.193-2.fc43 fedora 683.4 KiB fedora-gpg-keys noarch 43-0.2 fedora 129.0 KiB fedora-release noarch 43-0.19 fedora 0.0 B fedora-release-identity-basic noarch 43-0.19 fedora 664.0 B fedora-repos noarch 43-0.2 fedora 4.9 KiB fedora-repos-rawhide noarch 43-0.2 fedora 2.2 KiB file x86_64 5.46-5.fc43 fedora 100.2 KiB file-libs x86_64 5.46-5.fc43 fedora 11.9 MiB filesystem x86_64 3.18-44.fc43 fedora 112.0 B filesystem-srpm-macros noarch 3.18-44.fc43 fedora 38.2 KiB fonts-srpm-macros noarch 1:2.0.5-22.fc43 fedora 55.8 KiB forge-srpm-macros noarch 0.4.0-2.fc42 fedora 38.9 KiB fpc-srpm-macros noarch 1.3-14.fc42 fedora 144.0 B gdb-minimal x86_64 16.3-3.fc43 fedora 13.2 MiB gdbm-libs x86_64 1:1.23-9.fc42 fedora 129.9 KiB ghc-srpm-macros noarch 1.9.2-2.fc42 fedora 779.0 B glibc x86_64 2.41.9000-23.fc43 fedora 6.7 MiB glibc-common x86_64 2.41.9000-23.fc43 fedora 1.0 MiB glibc-gconv-extra x86_64 2.41.9000-23.fc43 fedora 7.2 MiB gmp x86_64 1:6.3.0-3.fc43 fedora 819.2 KiB gnat-srpm-macros noarch 6-7.fc42 fedora 1.0 KiB gnupg2 x86_64 2.4.8-2.fc43 fedora 6.5 MiB gnupg2-dirmngr x86_64 2.4.8-2.fc43 fedora 618.4 KiB gnupg2-gpg-agent x86_64 2.4.8-2.fc43 fedora 671.4 KiB gnupg2-gpgconf x86_64 2.4.8-2.fc43 fedora 250.0 KiB gnupg2-keyboxd x86_64 2.4.8-2.fc43 fedora 201.4 KiB gnupg2-verify x86_64 2.4.8-2.fc43 fedora 348.5 KiB gnutls x86_64 3.8.10-1.fc43 fedora 3.8 MiB go-srpm-macros noarch 3.7.0-1.fc43 fedora 61.6 KiB gpgverify noarch 2.2-2.fc43 fedora 8.7 KiB ima-evm-utils-libs x86_64 1.6.2-5.fc43 fedora 60.7 KiB jansson x86_64 2.14-2.fc42 fedora 93.1 KiB java-srpm-macros noarch 1-6.fc43 fedora 870.0 B json-c x86_64 0.18-4.fc43 fedora 82.7 KiB kernel-srpm-macros noarch 1.0-25.fc42 fedora 1.9 KiB keyutils-libs x86_64 1.6.3-5.fc42 fedora 58.3 KiB krb5-libs x86_64 1.21.3-6.fc43 fedora 2.3 MiB libacl x86_64 2.3.2-3.fc42 fedora 38.3 KiB libarchive x86_64 3.8.1-1.fc43 fedora 951.1 KiB libassuan x86_64 2.5.7-3.fc42 fedora 167.8 KiB libattr x86_64 2.5.2-5.fc42 fedora 27.1 KiB libblkid x86_64 2.41.1-11.fc43 fedora 262.4 KiB libbrotli x86_64 1.1.0-7.fc43 fedora 833.3 KiB libcap x86_64 2.76-1.fc43 fedora 209.2 KiB libcap-ng x86_64 0.8.5-5.fc43 fedora 68.9 KiB libcom_err x86_64 1.47.3-1.fc43 fedora 63.1 KiB libcurl x86_64 8.15.0-1.fc43 fedora 903.2 KiB libeconf x86_64 0.7.9-1.fc43 fedora 64.9 KiB libevent x86_64 2.1.12-15.fc42 fedora 903.1 KiB libfdisk x86_64 2.41.1-11.fc43 fedora 380.4 KiB libffi x86_64 3.5.1-1.fc43 fedora 83.6 KiB libfsverity x86_64 1.6-2.fc42 fedora 32.5 KiB libgcc x86_64 15.1.1-3.fc43 copr_base 266.6 KiB libgcrypt x86_64 1.11.1-1.fc43 fedora 1.6 MiB libgomp x86_64 15.1.1-3.fc43 copr_base 539.1 KiB libgpg-error x86_64 1.55-1.fc43 fedora 915.3 KiB libidn2 x86_64 2.3.8-1.fc43 fedora 552.5 KiB libksba x86_64 1.6.7-3.fc42 fedora 402.5 KiB liblastlog2 x86_64 2.41.1-11.fc43 fedora 33.9 KiB libmount x86_64 2.41.1-11.fc43 fedora 372.7 KiB libnghttp2 x86_64 1.66.0-1.fc43 fedora 162.2 KiB libpkgconf x86_64 2.3.0-2.fc42 fedora 78.1 KiB libpsl x86_64 0.21.5-5.fc42 fedora 76.4 KiB libselinux x86_64 3.9-1.fc43 fedora 193.1 KiB libsemanage x86_64 3.9-1.fc43 fedora 308.4 KiB libsepol x86_64 3.9-1.fc43 fedora 821.9 KiB libsmartcols x86_64 2.41.1-11.fc43 fedora 180.5 KiB libssh x86_64 0.11.2-1.fc43 fedora 566.7 KiB libssh-config noarch 0.11.2-1.fc43 fedora 277.0 B libstdc++ x86_64 15.1.1-3.fc43 copr_base 2.8 MiB libtasn1 x86_64 4.20.0-1.fc43 fedora 176.3 KiB libtool-ltdl x86_64 2.5.4-5.fc43 fedora 70.1 KiB libunistring x86_64 1.1-9.fc42 fedora 1.7 MiB libusb1 x86_64 1.0.28-2.fc43 fedora 171.0 KiB libuuid x86_64 2.41.1-11.fc43 fedora 37.4 KiB libverto x86_64 0.3.2-10.fc42 fedora 25.4 KiB libxcrypt x86_64 4.4.38-7.fc43 fedora 284.5 KiB libxml2 x86_64 2.12.10-2.fc43 fedora 1.7 MiB libzstd x86_64 1.5.7-1.fc43 fedora 807.8 KiB lua-libs x86_64 5.4.8-1.fc43 fedora 280.8 KiB lua-srpm-macros noarch 1-15.fc42 fedora 1.3 KiB lz4-libs x86_64 1.10.0-2.fc42 fedora 157.4 KiB mpfr x86_64 4.2.2-1.fc43 fedora 828.8 KiB ncurses-base noarch 6.5-6.20250614.fc43 fedora 328.1 KiB ncurses-libs x86_64 6.5-6.20250614.fc43 fedora 946.3 KiB nettle x86_64 3.10.1-1.fc43 fedora 790.5 KiB npth x86_64 1.8-2.fc42 fedora 49.6 KiB ocaml-srpm-macros noarch 10-4.fc42 fedora 1.9 KiB openblas-srpm-macros noarch 2-19.fc42 fedora 112.0 B openldap x86_64 2.6.10-2.fc43 fedora 655.8 KiB openssl-libs x86_64 1:3.5.1-1.fc43 fedora 8.9 MiB p11-kit x86_64 0.25.5-8.fc43 fedora 2.2 MiB p11-kit-trust x86_64 0.25.5-8.fc43 fedora 395.5 KiB package-notes-srpm-macros noarch 0.5-13.fc42 fedora 1.6 KiB pam-libs x86_64 1.7.1-2.fc43 fedora 126.8 KiB pcre2 x86_64 10.45-1.fc43 fedora 697.7 KiB pcre2-syntax noarch 10.45-1.fc43 fedora 273.9 KiB perl-srpm-macros noarch 1-59.fc43 fedora 861.0 B pkgconf x86_64 2.3.0-2.fc42 fedora 88.5 KiB pkgconf-m4 noarch 2.3.0-2.fc42 fedora 14.4 KiB pkgconf-pkg-config x86_64 2.3.0-2.fc42 fedora 989.0 B popt x86_64 1.19-8.fc42 fedora 132.8 KiB publicsuffix-list-dafsa noarch 20250616-1.fc43 fedora 69.1 KiB pyproject-srpm-macros noarch 1.18.3-1.fc43 fedora 1.9 KiB python-srpm-macros noarch 3.14-3.fc43 fedora 51.5 KiB qt5-srpm-macros noarch 5.15.17-1.fc43 fedora 500.0 B qt6-srpm-macros noarch 6.9.1-1.fc43 fedora 464.0 B readline x86_64 8.3-1.fc43 fedora 511.7 KiB rpm x86_64 5.99.91-1.fc43 fedora 3.0 MiB rpm-build-libs x86_64 5.99.91-1.fc43 fedora 268.4 KiB rpm-libs x86_64 5.99.91-1.fc43 fedora 933.7 KiB rpm-sequoia x86_64 1.9.0-1.fc43 fedora 2.5 MiB rpm-sign-libs x86_64 5.99.91-1.fc43 fedora 39.7 KiB rust-srpm-macros noarch 26.3-4.fc42 fedora 4.8 KiB setup noarch 2.15.0-25.fc43 fedora 725.0 KiB sqlite-libs x86_64 3.50.2-1.fc43 fedora 1.5 MiB systemd-libs x86_64 257.7-1.fc43 fedora 2.2 MiB systemd-standalone-sysusers x86_64 257.7-1.fc43 fedora 277.3 KiB tpm2-tss x86_64 4.1.3-7.fc43 fedora 1.6 MiB tree-sitter-srpm-macros noarch 0.4.1-1.fc43 fedora 8.2 KiB util-linux-core x86_64 2.41.1-11.fc43 fedora 1.5 MiB xxhash-libs x86_64 0.8.3-2.fc42 fedora 90.2 KiB xz-libs x86_64 1:5.8.1-1.fc43 fedora 217.8 KiB zig-srpm-macros noarch 1-4.fc42 fedora 1.1 KiB zip x86_64 3.0-43.fc42 fedora 698.5 KiB zlib-ng-compat x86_64 2.2.4-2.fc43 fedora 137.6 KiB zstd x86_64 1.5.7-1.fc43 fedora 1.7 MiB Installing groups: Buildsystem building group Transaction Summary: Installing: 169 packages Total size of inbound packages is 59 MiB. Need to download 59 MiB. After this operation, 198 MiB extra will be used (install 198 MiB, remove 0 B). [ 1/169] bzip2-0:1.0.8-20.fc42.x86_64 100% | 460.8 KiB/s | 52.1 KiB | 00m00s [ 2/169] cpio-0:2.15-2.fc41.x86_64 100% | 3.8 MiB/s | 291.8 KiB | 00m00s [ 3/169] bash-0:5.3.0-1.fc43.x86_64 100% | 8.1 MiB/s | 1.9 MiB | 00m00s [ 4/169] coreutils-0:9.7-4.fc43.x86_64 100% | 4.9 MiB/s | 1.1 MiB | 00m00s [ 5/169] diffutils-0:3.12-2.fc43.x86_6 100% | 7.8 MiB/s | 392.7 KiB | 00m00s [ 6/169] fedora-release-common-0:43-0. 100% | 1.2 MiB/s | 25.4 KiB | 00m00s [ 7/169] glibc-minimal-langpack-0:2.41 100% | 1.2 MiB/s | 35.2 KiB | 00m00s [ 8/169] findutils-1:4.10.0-5.fc42.x86 100% | 13.8 MiB/s | 551.5 KiB | 00m00s [ 9/169] grep-0:3.12-1.fc43.x86_64 100% | 9.1 MiB/s | 299.5 KiB | 00m00s [ 10/169] gzip-0:1.13-3.fc42.x86_64 100% | 5.0 MiB/s | 170.4 KiB | 00m00s [ 11/169] patch-0:2.8-1.fc43.x86_64 100% | 3.7 MiB/s | 113.7 KiB | 00m00s [ 12/169] redhat-rpm-config-0:343-7.fc4 100% | 3.5 MiB/s | 78.9 KiB | 00m00s [ 13/169] rpm-build-0:5.99.91-1.fc43.x8 100% | 6.0 MiB/s | 136.3 KiB | 00m00s [ 14/169] sed-0:4.9-4.fc42.x86_64 100% | 11.1 MiB/s | 317.3 KiB | 00m00s [ 15/169] info-0:7.2-4.fc43.x86_64 100% | 1.7 MiB/s | 182.8 KiB | 00m00s [ 16/169] tar-2:1.35-5.fc42.x86_64 100% | 19.6 MiB/s | 862.5 KiB | 00m00s [ 17/169] unzip-0:6.0-66.fc42.x86_64 100% | 7.5 MiB/s | 184.6 KiB | 00m00s [ 18/169] which-0:2.23-2.fc43.x86_64 100% | 1.6 MiB/s | 41.8 KiB | 00m00s [ 19/169] shadow-utils-2:4.18.0-1.fc43. 100% | 14.7 MiB/s | 1.3 MiB | 00m00s [ 20/169] xz-1:5.8.1-1.fc43.x86_64 100% | 17.5 MiB/s | 572.5 KiB | 00m00s [ 21/169] util-linux-0:2.41.1-11.fc43.x 100% | 27.1 MiB/s | 1.2 MiB | 00m00s [ 22/169] gawk-0:5.3.2-1.fc43.x86_64 100% | 16.1 MiB/s | 1.1 MiB | 00m00s [ 23/169] filesystem-0:3.18-44.fc43.x86 100% | 21.2 MiB/s | 1.3 MiB | 00m00s [ 24/169] glibc-0:2.41.9000-23.fc43.x86 100% | 45.8 MiB/s | 2.2 MiB | 00m00s [ 25/169] ncurses-libs-0:6.5-6.20250614 100% | 11.6 MiB/s | 333.1 KiB | 00m00s [ 26/169] bzip2-libs-0:1.0.8-20.fc42.x8 100% | 1.9 MiB/s | 43.6 KiB | 00m00s [ 27/169] coreutils-common-0:9.7-4.fc43 100% | 20.2 MiB/s | 2.1 MiB | 00m00s [ 28/169] libattr-0:2.5.2-5.fc42.x86_64 100% | 813.5 KiB/s | 17.1 KiB | 00m00s [ 29/169] gmp-1:6.3.0-3.fc43.x86_64 100% | 2.5 MiB/s | 322.2 KiB | 00m00s [ 30/169] libcap-0:2.76-1.fc43.x86_64 100% | 3.9 MiB/s | 86.9 KiB | 00m00s [ 31/169] libselinux-0:3.9-1.fc43.x86_6 100% | 4.0 MiB/s | 97.2 KiB | 00m00s [ 32/169] openssl-libs-1:3.5.1-1.fc43.x 100% | 44.3 MiB/s | 2.6 MiB | 00m00s [ 33/169] systemd-libs-0:257.7-1.fc43.x 100% | 13.1 MiB/s | 789.7 KiB | 00m00s [ 34/169] fedora-repos-0:43-0.2.noarch 100% | 384.6 KiB/s | 9.2 KiB | 00m00s [ 35/169] libacl-0:2.3.2-3.fc42.x86_64 100% | 97.9 KiB/s | 23.0 KiB | 00m00s [ 36/169] glibc-common-0:2.41.9000-23.f 100% | 9.3 MiB/s | 322.1 KiB | 00m00s [ 37/169] pcre2-0:10.45-1.fc43.x86_64 100% | 10.7 MiB/s | 262.8 KiB | 00m00s [ 38/169] ed-0:1.21.1-1.fc43.x86_64 100% | 3.6 MiB/s | 82.2 KiB | 00m00s [ 39/169] ansible-srpm-macros-0:1-17.1. 100% | 967.4 KiB/s | 20.3 KiB | 00m00s [ 40/169] build-reproducibility-srpm-ma 100% | 556.4 KiB/s | 11.7 KiB | 00m00s [ 41/169] dwz-0:0.16-1.fc43.x86_64 100% | 5.5 MiB/s | 135.5 KiB | 00m00s [ 42/169] efi-srpm-macros-0:6-3.fc43.no 100% | 1.0 MiB/s | 22.5 KiB | 00m00s [ 43/169] file-0:5.46-5.fc43.x86_64 100% | 2.3 MiB/s | 48.8 KiB | 00m00s [ 44/169] filesystem-srpm-macros-0:3.18 100% | 1.2 MiB/s | 26.0 KiB | 00m00s [ 45/169] fonts-srpm-macros-1:2.0.5-22. 100% | 1.3 MiB/s | 27.2 KiB | 00m00s [ 46/169] forge-srpm-macros-0:0.4.0-2.f 100% | 945.3 KiB/s | 19.9 KiB | 00m00s [ 47/169] fpc-srpm-macros-0:1.3-14.fc42 100% | 401.0 KiB/s | 8.0 KiB | 00m00s [ 48/169] ghc-srpm-macros-0:1.9.2-2.fc4 100% | 436.0 KiB/s | 9.2 KiB | 00m00s [ 49/169] gnat-srpm-macros-0:6-7.fc42.n 100% | 410.1 KiB/s | 8.6 KiB | 00m00s [ 50/169] go-srpm-macros-0:3.7.0-1.fc43 100% | 1.3 MiB/s | 27.9 KiB | 00m00s [ 51/169] java-srpm-macros-0:1-6.fc43.n 100% | 393.4 KiB/s | 7.9 KiB | 00m00s [ 52/169] kernel-srpm-macros-0:1.0-25.f 100% | 493.6 KiB/s | 9.9 KiB | 00m00s [ 53/169] lua-srpm-macros-0:1-15.fc42.n 100% | 424.6 KiB/s | 8.9 KiB | 00m00s [ 54/169] ocaml-srpm-macros-0:10-4.fc42 100% | 460.3 KiB/s | 9.2 KiB | 00m00s [ 55/169] openblas-srpm-macros-0:2-19.f 100% | 388.3 KiB/s | 7.8 KiB | 00m00s [ 56/169] package-notes-srpm-macros-0:0 100% | 440.9 KiB/s | 9.3 KiB | 00m00s [ 57/169] perl-srpm-macros-0:1-59.fc43. 100% | 423.1 KiB/s | 8.5 KiB | 00m00s [ 58/169] pyproject-srpm-macros-0:1.18. 100% | 578.7 KiB/s | 13.3 KiB | 00m00s [ 59/169] python-srpm-macros-0:3.14-3.f 100% | 1.1 MiB/s | 23.2 KiB | 00m00s [ 60/169] qt5-srpm-macros-0:5.15.17-1.f 100% | 435.9 KiB/s | 8.7 KiB | 00m00s [ 61/169] qt6-srpm-macros-0:6.9.1-1.fc4 100% | 375.4 KiB/s | 9.4 KiB | 00m00s [ 62/169] rust-srpm-macros-0:26.3-4.fc4 100% | 450.2 KiB/s | 11.7 KiB | 00m00s [ 63/169] rpm-0:5.99.91-1.fc43.x86_64 100% | 15.3 MiB/s | 563.4 KiB | 00m00s [ 64/169] tree-sitter-srpm-macros-0:0.4 100% | 620.4 KiB/s | 13.0 KiB | 00m00s [ 65/169] zig-srpm-macros-0:1-4.fc42.no 100% | 392.6 KiB/s | 8.2 KiB | 00m00s [ 66/169] zip-0:3.0-43.fc42.x86_64 100% | 9.9 MiB/s | 263.5 KiB | 00m00s [ 67/169] debugedit-0:5.2-1.fc43.x86_64 100% | 3.7 MiB/s | 80.6 KiB | 00m00s [ 68/169] elfutils-libelf-0:0.193-2.fc4 100% | 6.5 MiB/s | 207.9 KiB | 00m00s [ 69/169] libarchive-0:3.8.1-1.fc43.x86 100% | 12.5 MiB/s | 421.4 KiB | 00m00s [ 70/169] elfutils-0:0.193-2.fc43.x86_6 100% | 11.4 MiB/s | 571.5 KiB | 00m00s [ 71/169] popt-0:1.19-8.fc42.x86_64 100% | 2.9 MiB/s | 66.0 KiB | 00m00s [ 72/169] readline-0:8.3-1.fc43.x86_64 100% | 9.5 MiB/s | 224.7 KiB | 00m00s [ 73/169] rpm-build-libs-0:5.99.91-1.fc 100% | 4.8 MiB/s | 127.5 KiB | 00m00s [ 74/169] rpm-libs-0:5.99.91-1.fc43.x86 100% | 13.0 MiB/s | 399.9 KiB | 00m00s [ 75/169] zstd-0:1.5.7-1.fc43.x86_64 100% | 18.2 MiB/s | 485.8 KiB | 00m00s [ 76/169] audit-libs-0:4.1.0-1.fc43.x86 100% | 5.0 MiB/s | 138.3 KiB | 00m00s [ 77/169] libeconf-0:0.7.9-1.fc43.x86_6 100% | 1.6 MiB/s | 35.2 KiB | 00m00s [ 78/169] libsemanage-0:3.9-1.fc43.x86_ 100% | 5.5 MiB/s | 123.3 KiB | 00m00s [ 79/169] libxcrypt-0:4.4.38-7.fc43.x86 100% | 4.8 MiB/s | 127.2 KiB | 00m00s [ 80/169] pam-libs-0:1.7.1-2.fc43.x86_6 100% | 2.7 MiB/s | 57.7 KiB | 00m00s [ 81/169] setup-0:2.15.0-25.fc43.noarch 100% | 5.7 MiB/s | 157.6 KiB | 00m00s [ 82/169] xz-libs-1:5.8.1-1.fc43.x86_64 100% | 4.4 MiB/s | 113.0 KiB | 00m00s [ 83/169] mpfr-0:4.2.2-1.fc43.x86_64 100% | 12.1 MiB/s | 346.7 KiB | 00m00s [ 84/169] libblkid-0:2.41.1-11.fc43.x86 100% | 5.5 MiB/s | 124.1 KiB | 00m00s [ 85/169] libcap-ng-0:0.8.5-5.fc43.x86_ 100% | 1.5 MiB/s | 32.2 KiB | 00m00s [ 86/169] libfdisk-0:2.41.1-11.fc43.x86 100% | 6.6 MiB/s | 162.1 KiB | 00m00s [ 87/169] liblastlog2-0:2.41.1-11.fc43. 100% | 1.1 MiB/s | 24.0 KiB | 00m00s [ 88/169] libmount-0:2.41.1-11.fc43.x86 100% | 5.5 MiB/s | 163.3 KiB | 00m00s [ 89/169] libuuid-0:2.41.1-11.fc43.x86_ 100% | 1.3 MiB/s | 27.0 KiB | 00m00s [ 90/169] libsmartcols-0:2.41.1-11.fc43 100% | 3.8 MiB/s | 84.9 KiB | 00m00s [ 91/169] zlib-ng-compat-0:2.2.4-2.fc43 100% | 3.4 MiB/s | 79.1 KiB | 00m00s [ 92/169] util-linux-core-0:2.41.1-11.f 100% | 11.2 MiB/s | 551.7 KiB | 00m00s [ 93/169] ncurses-base-0:6.5-6.20250614 100% | 3.9 MiB/s | 88.3 KiB | 00m00s [ 94/169] glibc-gconv-extra-0:2.41.9000 100% | 29.3 MiB/s | 1.6 MiB | 00m00s [ 95/169] crypto-policies-0:20250714-1. 100% | 3.7 MiB/s | 98.6 KiB | 00m00s [ 96/169] ca-certificates-0:2024.2.69_v 100% | 25.6 MiB/s | 945.0 KiB | 00m00s [ 97/169] libsepol-0:3.9-1.fc43.x86_64 100% | 8.4 MiB/s | 345.4 KiB | 00m00s [ 98/169] fedora-gpg-keys-0:43-0.2.noar 100% | 5.3 MiB/s | 136.6 KiB | 00m00s [ 99/169] fedora-repos-rawhide-0:43-0.2 100% | 366.8 KiB/s | 8.8 KiB | 00m00s [100/169] pcre2-syntax-0:10.45-1.fc43.n 100% | 5.6 MiB/s | 161.7 KiB | 00m00s [101/169] add-determinism-0:0.6.0-1.fc4 100% | 24.2 MiB/s | 918.3 KiB | 00m00s [102/169] file-libs-0:5.46-5.fc43.x86_6 100% | 19.8 MiB/s | 849.8 KiB | 00m00s [103/169] curl-0:8.15.0-1.fc43.x86_64 100% | 6.5 MiB/s | 233.8 KiB | 00m00s [104/169] elfutils-libs-0:0.193-2.fc43. 100% | 10.6 MiB/s | 270.2 KiB | 00m00s [105/169] elfutils-debuginfod-client-0: 100% | 2.1 MiB/s | 47.0 KiB | 00m00s [106/169] libzstd-0:1.5.7-1.fc43.x86_64 100% | 11.4 MiB/s | 314.8 KiB | 00m00s [107/169] lz4-libs-0:1.10.0-2.fc42.x86_ 100% | 3.0 MiB/s | 78.1 KiB | 00m00s [108/169] libxml2-0:2.12.10-2.fc43.x86_ 100% | 22.5 MiB/s | 691.3 KiB | 00m00s [109/169] lua-libs-0:5.4.8-1.fc43.x86_6 100% | 5.6 MiB/s | 131.9 KiB | 00m00s [110/169] rpm-sign-libs-0:5.99.91-1.fc4 100% | 1.3 MiB/s | 28.2 KiB | 00m00s [111/169] elfutils-default-yama-scope-0 100% | 419.5 KiB/s | 12.6 KiB | 00m00s [112/169] sqlite-libs-0:3.50.2-1.fc43.x 100% | 10.6 MiB/s | 761.3 KiB | 00m00s [113/169] json-c-0:0.18-4.fc43.x86_64 100% | 1.9 MiB/s | 44.7 KiB | 00m00s [114/169] ima-evm-utils-libs-0:1.6.2-5. 100% | 1.2 MiB/s | 29.5 KiB | 00m00s [115/169] libfsverity-0:1.6-2.fc42.x86_ 100% | 626.1 KiB/s | 18.8 KiB | 00m00s [116/169] gnupg2-0:2.4.8-2.fc43.x86_64 100% | 18.7 MiB/s | 1.6 MiB | 00m00s [117/169] gpgverify-0:2.2-2.fc43.noarch 100% | 364.1 KiB/s | 10.9 KiB | 00m00s [118/169] gnupg2-dirmngr-0:2.4.8-2.fc43 100% | 8.9 MiB/s | 274.8 KiB | 00m00s [119/169] gnupg2-gpg-agent-0:2.4.8-2.fc 100% | 6.8 MiB/s | 273.0 KiB | 00m00s [120/169] gnupg2-gpgconf-0:2.4.8-2.fc43 100% | 4.7 MiB/s | 115.2 KiB | 00m00s [121/169] gnupg2-keyboxd-0:2.4.8-2.fc43 100% | 3.9 MiB/s | 94.8 KiB | 00m00s [122/169] gnupg2-verify-0:2.4.8-2.fc43. 100% | 6.7 MiB/s | 171.3 KiB | 00m00s [123/169] libassuan-0:2.5.7-3.fc42.x86_ 100% | 2.9 MiB/s | 67.6 KiB | 00m00s [124/169] libgcrypt-0:1.11.1-1.fc43.x86 100% | 15.3 MiB/s | 596.1 KiB | 00m00s [125/169] libgpg-error-0:1.55-1.fc43.x8 100% | 6.4 MiB/s | 244.1 KiB | 00m00s [126/169] npth-0:1.8-2.fc42.x86_64 100% | 1.2 MiB/s | 25.8 KiB | 00m00s [127/169] tpm2-tss-0:4.1.3-7.fc43.x86_6 100% | 9.2 MiB/s | 423.4 KiB | 00m00s [128/169] gnutls-0:3.8.10-1.fc43.x86_64 100% | 28.6 MiB/s | 1.4 MiB | 00m00s [129/169] libksba-0:1.6.7-3.fc42.x86_64 100% | 5.3 MiB/s | 162.0 KiB | 00m00s [130/169] openldap-0:2.6.10-2.fc43.x86_ 100% | 10.1 MiB/s | 259.1 KiB | 00m00s [131/169] libusb1-0:1.0.28-2.fc43.x86_6 100% | 3.2 MiB/s | 79.3 KiB | 00m00s [132/169] libidn2-0:2.3.8-1.fc43.x86_64 100% | 7.4 MiB/s | 174.8 KiB | 00m00s [133/169] libtasn1-0:4.20.0-1.fc43.x86_ 100% | 3.1 MiB/s | 75.0 KiB | 00m00s [134/169] libunistring-0:1.1-9.fc42.x86 100% | 17.7 MiB/s | 542.5 KiB | 00m00s [135/169] nettle-0:3.10.1-1.fc43.x86_64 100% | 9.9 MiB/s | 424.6 KiB | 00m00s [136/169] p11-kit-0:0.25.5-8.fc43.x86_6 100% | 14.4 MiB/s | 488.2 KiB | 00m00s [137/169] rpm-sequoia-0:1.9.0-1.fc43.x8 100% | 1.9 MiB/s | 932.9 KiB | 00m00s [138/169] libevent-0:2.1.12-15.fc42.x86 100% | 10.2 MiB/s | 260.2 KiB | 00m00s [139/169] cyrus-sasl-lib-0:2.1.28-30.fc 100% | 13.4 MiB/s | 793.5 KiB | 00m00s [140/169] libffi-0:3.5.1-1.fc43.x86_64 100% | 1.9 MiB/s | 40.9 KiB | 00m00s [141/169] gdbm-libs-1:1.23-9.fc42.x86_6 100% | 2.3 MiB/s | 57.0 KiB | 00m00s [142/169] libgcc-0:15.1.1-3.fc43.x86_64 100% | 2.3 MiB/s | 129.5 KiB | 00m00s [143/169] p11-kit-trust-0:0.25.5-8.fc43 100% | 5.6 MiB/s | 132.4 KiB | 00m00s [144/169] alternatives-0:1.33-1.fc43.x8 100% | 1.9 MiB/s | 40.5 KiB | 00m00s [145/169] jansson-0:2.14-2.fc42.x86_64 100% | 2.0 MiB/s | 45.7 KiB | 00m00s [146/169] pkgconf-pkg-config-0:2.3.0-2. 100% | 472.6 KiB/s | 9.9 KiB | 00m00s [147/169] pkgconf-0:2.3.0-2.fc42.x86_64 100% | 2.1 MiB/s | 44.9 KiB | 00m00s [148/169] pkgconf-m4-0:2.3.0-2.fc42.noa 100% | 677.9 KiB/s | 14.2 KiB | 00m00s [149/169] libpkgconf-0:2.3.0-2.fc42.x86 100% | 1.6 MiB/s | 38.4 KiB | 00m00s [150/169] binutils-0:2.44.90-2.fc43.x86 100% | 24.4 MiB/s | 5.8 MiB | 00m00s [151/169] libstdc++-0:15.1.1-3.fc43.x86 100% | 16.9 MiB/s | 916.6 KiB | 00m00s [152/169] libgomp-0:15.1.1-3.fc43.x86_6 100% | 17.9 MiB/s | 367.4 KiB | 00m00s [153/169] fedora-release-0:43-0.19.noar 100% | 682.3 KiB/s | 14.3 KiB | 00m00s [154/169] systemd-standalone-sysusers-0 100% | 5.7 MiB/s | 134.8 KiB | 00m00s [155/169] libtool-ltdl-0:2.5.4-5.fc43.x 100% | 104.8 KiB/s | 36.2 KiB | 00m00s [156/169] xxhash-libs-0:0.8.3-2.fc42.x8 100% | 1.8 MiB/s | 39.1 KiB | 00m00s [157/169] libcurl-0:8.15.0-1.fc43.x86_6 100% | 11.6 MiB/s | 404.5 KiB | 00m00s [158/169] fedora-release-identity-basic 100% | 181.9 KiB/s | 15.1 KiB | 00m00s [159/169] krb5-libs-0:1.21.3-6.fc43.x86 100% | 18.1 MiB/s | 759.5 KiB | 00m00s [160/169] libnghttp2-0:1.66.0-1.fc43.x8 100% | 3.0 MiB/s | 72.7 KiB | 00m00s [161/169] gdb-minimal-0:16.3-3.fc43.x86 100% | 29.2 MiB/s | 4.4 MiB | 00m00s [162/169] libpsl-0:0.21.5-5.fc42.x86_64 100% | 2.6 MiB/s | 64.0 KiB | 00m00s [163/169] libssh-0:0.11.2-1.fc43.x86_64 100% | 8.7 MiB/s | 232.8 KiB | 00m00s [164/169] keyutils-libs-0:1.6.3-5.fc42. 100% | 1.5 MiB/s | 31.5 KiB | 00m00s [165/169] libcom_err-0:1.47.3-1.fc43.x8 100% | 1.2 MiB/s | 26.8 KiB | 00m00s [166/169] libverto-0:0.3.2-10.fc42.x86_ 100% | 990.5 KiB/s | 20.8 KiB | 00m00s [167/169] publicsuffix-list-dafsa-0:202 100% | 2.6 MiB/s | 59.2 KiB | 00m00s [168/169] libssh-config-0:0.11.2-1.fc43 100% | 442.6 KiB/s | 8.9 KiB | 00m00s [169/169] libbrotli-0:1.1.0-7.fc43.x86_ 100% | 792.3 KiB/s | 339.1 KiB | 00m00s -------------------------------------------------------------------------------- [169/169] Total 100% | 21.3 MiB/s | 58.8 MiB | 00m03s Running transaction Importing OpenPGP key 0x31645531: UserID : "Fedora (43) " Fingerprint: C6E7F081CF80E13146676E88829B606631645531 From : file:///usr/share/distribution-gpg-keys/fedora/RPM-GPG-KEY-fedora-43-primary The key was successfully imported. Importing OpenPGP key 0x31645531: UserID : "Fedora (43) " Fingerprint: C6E7F081CF80E13146676E88829B606631645531 From : file:///usr/share/distribution-gpg-keys/fedora/RPM-GPG-KEY-fedora-43-primary The key was successfully imported. Importing OpenPGP key 0x105EF944: UserID : "Fedora (42) " Fingerprint: B0F4950458F69E1150C6C5EDC8AC4916105EF944 From : file:///usr/share/distribution-gpg-keys/fedora/RPM-GPG-KEY-fedora-42-primary The key was successfully imported. Importing OpenPGP key 0x6D9F90A6: UserID : "Fedora (44) " Fingerprint: 36F612DCF27F7D1A48A835E4DBFCF71C6D9F90A6 From : file:///usr/share/distribution-gpg-keys/fedora/RPM-GPG-KEY-fedora-44-primary The key was successfully imported. [ 1/171] Verify package files 100% | 681.0 B/s | 169.0 B | 00m00s >>> Running %pretrans scriptlet: filesystem-0:3.18-44.fc43.x86_64 >>> Finished %pretrans scriptlet: filesystem-0:3.18-44.fc43.x86_64 >>> [RPM] /var/lib/mock/fedora-rawhide-x86_64-1753289447.166372/root/var/cache/d [ 2/171] Prepare transaction 100% | 1.9 KiB/s | 169.0 B | 00m00s [ 3/171] Installing libgcc-0:15.1.1-3. 100% | 131.0 MiB/s | 268.3 KiB | 00m00s [ 4/171] Installing libssh-config-0:0. 100% | 0.0 B/s | 816.0 B | 00m00s [ 5/171] Installing publicsuffix-list- 100% | 68.2 MiB/s | 69.8 KiB | 00m00s [ 6/171] Installing fedora-release-ide 100% | 898.4 KiB/s | 920.0 B | 00m00s [ 7/171] Installing fedora-gpg-keys-0: 100% | 19.1 MiB/s | 175.9 KiB | 00m00s [ 8/171] Installing fedora-repos-rawhi 100% | 0.0 B/s | 2.4 KiB | 00m00s [ 9/171] Installing fedora-repos-0:43- 100% | 5.6 MiB/s | 5.7 KiB | 00m00s [ 10/171] Installing fedora-release-com 100% | 12.1 MiB/s | 24.8 KiB | 00m00s [ 11/171] Installing fedora-release-0:4 100% | 8.1 KiB/s | 124.0 B | 00m00s >>> Running sysusers scriptlet: setup-0:2.15.0-25.fc43.noarch >>> Finished sysusers scriptlet: setup-0:2.15.0-25.fc43.noarch >>> Scriptlet output: >>> Creating group 'adm' with GID 4. >>> Creating group 'audio' with GID 63. >>> Creating group 'cdrom' with GID 11. >>> Creating group 'clock' with GID 103. >>> Creating group 'dialout' with GID 18. >>> Creating group 'disk' with GID 6. >>> Creating group 'floppy' with GID 19. >>> Creating group 'ftp' with GID 50. >>> Creating group 'games' with GID 20. >>> Creating group 'input' with GID 104. >>> Creating group 'kmem' with GID 9. >>> Creating group 'kvm' with GID 36. >>> Creating group 'lock' with GID 54. >>> Creating group 'lp' with GID 7. >>> Creating group 'mail' with GID 12. >>> Creating group 'man' with GID 15. >>> Creating group 'mem' with GID 8. >>> Creating group 'nobody' with GID 65534. >>> Creating group 'render' with GID 105. >>> Creating group 'root' with GID 0. >>> Creating group 'sgx' with GID 106. >>> Creating group 'sys' with GID 3. >>> Creating group 'tape' with GID 33. >>> Creating group 'tty' with GID 5. >>> Creating group 'users' with GID 100. >>> Creating group 'utmp' with GID 22. >>> Creating group 'video' with GID 39. >>> Creating group 'wheel' with GID 10. >>> Creating user 'adm' (adm) with UID 3 and GID 4. >>> Creating group 'bin' with GID 1. >>> Creating user 'bin' (bin) with UID 1 and GID 1. >>> Creating group 'daemon' with GID 2. >>> Creating user 'daemon' (daemon) with UID 2 and GID 2. >>> Creating user 'ftp' (FTP User) with UID 14 and GID 50. >>> Creating user 'games' (games) with UID 12 and GID 100. >>> Creating user 'halt' (halt) with UID 7 and GID 0. >>> Creating user 'lp' (lp) with UID 4 and GID 7. >>> Creating user 'mail' (mail) with UID 8 and GID 12. >>> Creating user 'nobody' (Kernel Overflow User) with UID 65534 and GID 65534. >>> Creating user 'operator' (operator) with UID 11 and GID 0. >>> Creating user 'root' (Super User) with UID 0 and GID 0. >>> Creating user 'shutdown' (shutdown) with UID 6 and GID 0. >>> Creating user 'sync' (sync) with UID 5 and GID 0. >>> [ 12/171] Installing setup-0:2.15.0-25. 100% | 34.0 MiB/s | 730.6 KiB | 00m00s >>> [RPM] /etc/hosts created as /etc/hosts.rpmnew [ 13/171] Installing filesystem-0:3.18- 100% | 1.4 MiB/s | 212.5 KiB | 00m00s [ 14/171] Installing pkgconf-m4-0:2.3.0 100% | 14.5 MiB/s | 14.8 KiB | 00m00s [ 15/171] Installing pcre2-syntax-0:10. 100% | 135.0 MiB/s | 276.4 KiB | 00m00s [ 16/171] Installing ncurses-base-0:6.5 100% | 34.5 MiB/s | 353.5 KiB | 00m00s [ 17/171] Installing bash-0:5.3.0-1.fc4 100% | 196.1 MiB/s | 8.4 MiB | 00m00s [ 18/171] Installing glibc-common-0:2.4 100% | 48.6 MiB/s | 1.0 MiB | 00m00s [ 19/171] Installing glibc-gconv-extra- 100% | 143.4 MiB/s | 7.3 MiB | 00m00s [ 20/171] Installing glibc-0:2.41.9000- 100% | 142.4 MiB/s | 6.7 MiB | 00m00s [ 21/171] Installing ncurses-libs-0:6.5 100% | 155.1 MiB/s | 952.9 KiB | 00m00s [ 22/171] Installing glibc-minimal-lang 100% | 0.0 B/s | 124.0 B | 00m00s [ 23/171] Installing zlib-ng-compat-0:2 100% | 135.2 MiB/s | 138.4 KiB | 00m00s [ 24/171] Installing bzip2-libs-0:1.0.8 100% | 83.7 MiB/s | 85.7 KiB | 00m00s [ 25/171] Installing libgpg-error-0:1.5 100% | 50.0 MiB/s | 921.1 KiB | 00m00s [ 26/171] Installing libstdc++-0:15.1.1 100% | 258.6 MiB/s | 2.8 MiB | 00m00s [ 27/171] Installing xz-libs-1:5.8.1-1. 100% | 213.8 MiB/s | 218.9 KiB | 00m00s [ 28/171] Installing libassuan-0:2.5.7- 100% | 165.6 MiB/s | 169.6 KiB | 00m00s [ 29/171] Installing libgcrypt-0:1.11.1 100% | 262.5 MiB/s | 1.6 MiB | 00m00s [ 30/171] Installing readline-0:8.3-1.f 100% | 167.3 MiB/s | 513.9 KiB | 00m00s [ 31/171] Installing gmp-1:6.3.0-3.fc43 100% | 267.4 MiB/s | 821.5 KiB | 00m00s [ 32/171] Installing libuuid-0:2.41.1-1 100% | 37.4 MiB/s | 38.3 KiB | 00m00s [ 33/171] Installing popt-0:1.19-8.fc42 100% | 34.0 MiB/s | 139.4 KiB | 00m00s [ 34/171] Installing npth-0:1.8-2.fc42. 100% | 49.5 MiB/s | 50.7 KiB | 00m00s [ 35/171] Installing libblkid-0:2.41.1- 100% | 128.7 MiB/s | 263.5 KiB | 00m00s [ 36/171] Installing libxcrypt-0:4.4.38 100% | 140.2 MiB/s | 287.2 KiB | 00m00s [ 37/171] Installing libzstd-0:1.5.7-1. 100% | 263.4 MiB/s | 809.1 KiB | 00m00s [ 38/171] Installing elfutils-libelf-0: 100% | 233.3 MiB/s | 1.2 MiB | 00m00s [ 39/171] Installing sqlite-libs-0:3.50 100% | 252.7 MiB/s | 1.5 MiB | 00m00s [ 40/171] Installing gnupg2-gpgconf-0:2 100% | 18.9 MiB/s | 252.1 KiB | 00m00s [ 41/171] Installing libattr-0:2.5.2-5. 100% | 27.4 MiB/s | 28.1 KiB | 00m00s [ 42/171] Installing libacl-0:2.3.2-3.f 100% | 38.2 MiB/s | 39.2 KiB | 00m00s [ 43/171] Installing libtasn1-0:4.20.0- 100% | 87.0 MiB/s | 178.1 KiB | 00m00s [ 44/171] Installing libunistring-0:1.1 100% | 246.7 MiB/s | 1.7 MiB | 00m00s [ 45/171] Installing libidn2-0:2.3.8-1. 100% | 30.3 MiB/s | 558.7 KiB | 00m00s [ 46/171] Installing crypto-policies-0: 100% | 15.3 MiB/s | 172.0 KiB | 00m00s [ 47/171] Installing dwz-0:0.16-1.fc43. 100% | 18.8 MiB/s | 288.5 KiB | 00m00s [ 48/171] Installing gnupg2-verify-0:2. 100% | 24.4 MiB/s | 349.9 KiB | 00m00s [ 49/171] Installing mpfr-0:4.2.2-1.fc4 100% | 202.7 MiB/s | 830.4 KiB | 00m00s [ 50/171] Installing gawk-0:5.3.2-1.fc4 100% | 82.5 MiB/s | 1.8 MiB | 00m00s [ 51/171] Installing libksba-0:1.6.7-3. 100% | 131.9 MiB/s | 405.1 KiB | 00m00s [ 52/171] Installing unzip-0:6.0-66.fc4 100% | 27.5 MiB/s | 393.8 KiB | 00m00s [ 53/171] Installing file-libs-0:5.46-5 100% | 474.3 MiB/s | 11.9 MiB | 00m00s [ 54/171] Installing file-0:5.46-5.fc43 100% | 7.6 MiB/s | 101.7 KiB | 00m00s [ 55/171] Installing pcre2-0:10.45-1.fc 100% | 227.6 MiB/s | 699.1 KiB | 00m00s [ 56/171] Installing grep-0:3.12-1.fc43 100% | 50.1 MiB/s | 1.0 MiB | 00m00s [ 57/171] Installing xz-1:5.8.1-1.fc43. 100% | 57.9 MiB/s | 1.3 MiB | 00m00s [ 58/171] Installing libeconf-0:0.7.9-1 100% | 65.0 MiB/s | 66.5 KiB | 00m00s [ 59/171] Installing libcap-ng-0:0.8.5- 100% | 69.2 MiB/s | 70.8 KiB | 00m00s [ 60/171] Installing audit-libs-0:4.1.0 100% | 124.2 MiB/s | 381.5 KiB | 00m00s [ 61/171] Installing pam-libs-0:1.7.1-2 100% | 63.1 MiB/s | 129.2 KiB | 00m00s [ 62/171] Installing libcap-0:2.76-1.fc 100% | 14.9 MiB/s | 214.3 KiB | 00m00s [ 63/171] Installing systemd-libs-0:257 100% | 248.0 MiB/s | 2.2 MiB | 00m00s [ 64/171] Installing libsmartcols-0:2.4 100% | 177.4 MiB/s | 181.6 KiB | 00m00s [ 65/171] Installing libsepol-0:3.9-1.f 100% | 200.9 MiB/s | 822.9 KiB | 00m00s [ 66/171] Installing libselinux-0:3.9-1 100% | 94.9 MiB/s | 194.3 KiB | 00m00s [ 67/171] Installing findutils-1:4.10.0 100% | 85.2 MiB/s | 1.9 MiB | 00m00s [ 68/171] Installing sed-0:4.9-4.fc42.x 100% | 42.3 MiB/s | 865.5 KiB | 00m00s [ 69/171] Installing libmount-0:2.41.1- 100% | 182.5 MiB/s | 373.8 KiB | 00m00s [ 70/171] Installing lz4-libs-0:1.10.0- 100% | 154.7 MiB/s | 158.5 KiB | 00m00s [ 71/171] Installing lua-libs-0:5.4.8-1 100% | 137.7 MiB/s | 282.0 KiB | 00m00s [ 72/171] Installing json-c-0:0.18-4.fc 100% | 82.0 MiB/s | 84.0 KiB | 00m00s [ 73/171] Installing libffi-0:3.5.1-1.f 100% | 83.0 MiB/s | 85.0 KiB | 00m00s [ 74/171] Installing p11-kit-0:0.25.5-8 100% | 84.0 MiB/s | 2.2 MiB | 00m00s [ 75/171] Installing alternatives-0:1.3 100% | 4.8 MiB/s | 63.8 KiB | 00m00s [ 76/171] Installing p11-kit-trust-0:0. 100% | 13.8 MiB/s | 397.1 KiB | 00m00s [ 77/171] Installing zstd-0:1.5.7-1.fc4 100% | 90.0 MiB/s | 1.7 MiB | 00m00s [ 78/171] Installing util-linux-core-0: 100% | 61.6 MiB/s | 1.5 MiB | 00m00s [ 79/171] Installing tar-2:1.35-5.fc42. 100% | 113.9 MiB/s | 3.0 MiB | 00m00s [ 80/171] Installing libsemanage-0:3.9- 100% | 151.5 MiB/s | 310.2 KiB | 00m00s [ 81/171] Installing systemd-standalone 100% | 20.9 MiB/s | 277.8 KiB | 00m00s [ 82/171] Installing libusb1-0:1.0.28-2 100% | 84.3 MiB/s | 172.7 KiB | 00m00s [ 83/171] Installing zip-0:3.0-43.fc42. 100% | 45.7 MiB/s | 702.4 KiB | 00m00s [ 84/171] Installing gnupg2-keyboxd-0:2 100% | 14.1 MiB/s | 202.7 KiB | 00m00s [ 85/171] Installing libpsl-0:0.21.5-5. 100% | 75.7 MiB/s | 77.5 KiB | 00m00s [ 86/171] Installing liblastlog2-0:2.41 100% | 2.7 MiB/s | 35.9 KiB | 00m00s [ 87/171] Installing libfdisk-0:2.41.1- 100% | 124.2 MiB/s | 381.5 KiB | 00m00s [ 88/171] Installing nettle-0:3.10.1-1. 100% | 155.0 MiB/s | 793.6 KiB | 00m00s [ 89/171] Installing gnutls-0:3.8.10-1. 100% | 240.0 MiB/s | 3.8 MiB | 00m00s [ 90/171] Installing libxml2-0:2.12.10- 100% | 85.2 MiB/s | 1.7 MiB | 00m00s [ 91/171] Installing bzip2-0:1.0.8-20.f 100% | 7.8 MiB/s | 103.8 KiB | 00m00s [ 92/171] Installing add-determinism-0: 100% | 117.4 MiB/s | 2.5 MiB | 00m00s [ 93/171] Installing build-reproducibil 100% | 1.0 MiB/s | 1.0 KiB | 00m00s [ 94/171] Installing cpio-0:2.15-2.fc41 100% | 57.9 MiB/s | 1.1 MiB | 00m00s [ 95/171] Installing diffutils-0:3.12-2 100% | 74.3 MiB/s | 1.6 MiB | 00m00s [ 96/171] Installing ed-0:1.21.1-1.fc43 100% | 10.9 MiB/s | 145.1 KiB | 00m00s [ 97/171] Installing patch-0:2.8-1.fc43 100% | 17.2 MiB/s | 228.3 KiB | 00m00s [ 98/171] Installing libtool-ltdl-0:2.5 100% | 69.6 MiB/s | 71.2 KiB | 00m00s [ 99/171] Installing gdbm-libs-1:1.23-9 100% | 128.5 MiB/s | 131.6 KiB | 00m00s [100/171] Installing cyrus-sasl-lib-0:2 100% | 109.7 MiB/s | 2.3 MiB | 00m00s [101/171] Installing jansson-0:2.14-2.f 100% | 92.2 MiB/s | 94.4 KiB | 00m00s [102/171] Installing libpkgconf-0:2.3.0 100% | 77.4 MiB/s | 79.2 KiB | 00m00s [103/171] Installing pkgconf-0:2.3.0-2. 100% | 6.3 MiB/s | 91.0 KiB | 00m00s [104/171] Installing pkgconf-pkg-config 100% | 147.8 KiB/s | 1.8 KiB | 00m00s [105/171] Installing libgomp-0:15.1.1-3 100% | 263.9 MiB/s | 540.4 KiB | 00m00s [106/171] Installing xxhash-libs-0:0.8. 100% | 89.4 MiB/s | 91.6 KiB | 00m00s [107/171] Installing libbrotli-0:1.1.0- 100% | 204.0 MiB/s | 835.6 KiB | 00m00s [108/171] Installing libnghttp2-0:1.66. 100% | 159.5 MiB/s | 163.3 KiB | 00m00s [109/171] Installing keyutils-libs-0:1. 100% | 58.3 MiB/s | 59.7 KiB | 00m00s [110/171] Installing libcom_err-0:1.47. 100% | 62.7 MiB/s | 64.2 KiB | 00m00s [111/171] Installing libverto-0:0.3.2-1 100% | 26.6 MiB/s | 27.2 KiB | 00m00s [112/171] Installing filesystem-srpm-ma 100% | 38.0 MiB/s | 38.9 KiB | 00m00s [113/171] Installing elfutils-default-y 100% | 170.2 KiB/s | 2.0 KiB | 00m00s [114/171] Installing elfutils-libs-0:0. 100% | 167.3 MiB/s | 685.2 KiB | 00m00s [115/171] Installing rust-srpm-macros-0 100% | 5.4 MiB/s | 5.6 KiB | 00m00s [116/171] Installing qt6-srpm-macros-0: 100% | 0.0 B/s | 740.0 B | 00m00s [117/171] Installing qt5-srpm-macros-0: 100% | 0.0 B/s | 776.0 B | 00m00s [118/171] Installing perl-srpm-macros-0 100% | 0.0 B/s | 1.1 KiB | 00m00s [119/171] Installing package-notes-srpm 100% | 2.0 MiB/s | 2.0 KiB | 00m00s [120/171] Installing openblas-srpm-macr 100% | 0.0 B/s | 392.0 B | 00m00s [121/171] Installing ocaml-srpm-macros- 100% | 0.0 B/s | 2.2 KiB | 00m00s [122/171] Installing kernel-srpm-macros 100% | 0.0 B/s | 2.3 KiB | 00m00s [123/171] Installing gnat-srpm-macros-0 100% | 0.0 B/s | 1.3 KiB | 00m00s [124/171] Installing ghc-srpm-macros-0: 100% | 0.0 B/s | 1.0 KiB | 00m00s [125/171] Installing fpc-srpm-macros-0: 100% | 0.0 B/s | 420.0 B | 00m00s [126/171] Installing ansible-srpm-macro 100% | 35.4 MiB/s | 36.2 KiB | 00m00s [127/171] Installing coreutils-common-0 100% | 245.5 MiB/s | 11.3 MiB | 00m00s [128/171] Installing openssl-libs-1:3.5 100% | 307.0 MiB/s | 8.9 MiB | 00m00s [129/171] Installing coreutils-0:9.7-4. 100% | 104.7 MiB/s | 5.4 MiB | 00m00s [130/171] Installing ca-certificates-0: 100% | 1.2 MiB/s | 2.4 MiB | 00m02s [131/171] Installing libarchive-0:3.8.1 100% | 186.1 MiB/s | 953.1 KiB | 00m00s [132/171] Installing krb5-libs-0:1.21.3 100% | 88.1 MiB/s | 2.3 MiB | 00m00s >>> Running sysusers scriptlet: tpm2-tss-0:4.1.3-7.fc43.x86_64 >>> Finished sysusers scriptlet: tpm2-tss-0:4.1.3-7.fc43.x86_64 >>> Scriptlet output: >>> Creating group 'tss' with GID 59. >>> Creating user 'tss' (Account used for TPM access) with UID 59 and GID 59. >>> [133/171] Installing tpm2-tss-0:4.1.3-7 100% | 174.2 MiB/s | 1.6 MiB | 00m00s [134/171] Installing ima-evm-utils-libs 100% | 60.5 MiB/s | 62.0 KiB | 00m00s [135/171] Installing gnupg2-gpg-agent-0 100% | 21.3 MiB/s | 675.4 KiB | 00m00s [136/171] Installing libssh-0:0.11.2-1. 100% | 138.9 MiB/s | 568.8 KiB | 00m00s [137/171] Installing gzip-0:1.13-3.fc42 100% | 24.3 MiB/s | 398.4 KiB | 00m00s [138/171] Installing rpm-sequoia-0:1.9. 100% | 275.4 MiB/s | 2.5 MiB | 00m00s [139/171] Installing rpm-libs-0:5.99.91 100% | 228.3 MiB/s | 935.3 KiB | 00m00s [140/171] Installing libfsverity-0:1.6- 100% | 32.7 MiB/s | 33.5 KiB | 00m00s [141/171] Installing libevent-0:2.1.12- 100% | 221.4 MiB/s | 906.9 KiB | 00m00s [142/171] Installing openldap-0:2.6.10- 100% | 161.0 MiB/s | 659.6 KiB | 00m00s [143/171] Installing libcurl-0:8.15.0-1 100% | 220.8 MiB/s | 904.3 KiB | 00m00s [144/171] Installing elfutils-debuginfo 100% | 6.0 MiB/s | 86.2 KiB | 00m00s [145/171] Installing elfutils-0:0.193-2 100% | 121.8 MiB/s | 2.9 MiB | 00m00s [146/171] Installing binutils-0:2.44.90 100% | 229.9 MiB/s | 26.4 MiB | 00m00s [147/171] Installing gdb-minimal-0:16.3 100% | 236.6 MiB/s | 13.2 MiB | 00m00s [148/171] Installing debugedit-0:5.2-1. 100% | 13.1 MiB/s | 200.5 KiB | 00m00s [149/171] Installing curl-0:8.15.0-1.fc 100% | 15.0 MiB/s | 476.3 KiB | 00m00s [150/171] Installing rpm-0:5.99.91-1.fc 100% | 45.3 MiB/s | 2.5 MiB | 00m00s [151/171] Installing efi-srpm-macros-0: 100% | 40.2 MiB/s | 41.1 KiB | 00m00s [152/171] Installing java-srpm-macros-0 100% | 0.0 B/s | 1.1 KiB | 00m00s [153/171] Installing lua-srpm-macros-0: 100% | 1.9 MiB/s | 1.9 KiB | 00m00s [154/171] Installing tree-sitter-srpm-m 100% | 9.0 MiB/s | 9.3 KiB | 00m00s [155/171] Installing zig-srpm-macros-0: 100% | 1.6 MiB/s | 1.7 KiB | 00m00s [156/171] Installing gnupg2-dirmngr-0:2 100% | 20.2 MiB/s | 621.1 KiB | 00m00s [157/171] Installing gnupg2-0:2.4.8-2.f 100% | 168.0 MiB/s | 6.6 MiB | 00m00s [158/171] Installing rpm-sign-libs-0:5. 100% | 39.6 MiB/s | 40.6 KiB | 00m00s [159/171] Installing rpm-build-libs-0:5 100% | 131.5 MiB/s | 269.2 KiB | 00m00s [160/171] Installing gpgverify-0:2.2-2. 100% | 9.2 MiB/s | 9.4 KiB | 00m00s [161/171] Installing rpm-build-0:5.99.9 100% | 18.2 MiB/s | 298.4 KiB | 00m00s [162/171] Installing pyproject-srpm-mac 100% | 2.4 MiB/s | 2.5 KiB | 00m00s [163/171] Installing redhat-rpm-config- 100% | 61.2 MiB/s | 188.1 KiB | 00m00s [164/171] Installing forge-srpm-macros- 100% | 39.3 MiB/s | 40.3 KiB | 00m00s [165/171] Installing fonts-srpm-macros- 100% | 55.7 MiB/s | 57.0 KiB | 00m00s [166/171] Installing go-srpm-macros-0:3 100% | 61.3 MiB/s | 62.7 KiB | 00m00s [167/171] Installing python-srpm-macros 100% | 51.6 MiB/s | 52.8 KiB | 00m00s [168/171] Installing which-0:2.23-2.fc4 100% | 5.6 MiB/s | 85.7 KiB | 00m00s [169/171] Installing util-linux-0:2.41. 100% | 63.7 MiB/s | 3.6 MiB | 00m00s [170/171] Installing shadow-utils-2:4.1 100% | 84.5 MiB/s | 4.0 MiB | 00m00s [171/171] Installing info-0:7.2-4.fc43. 100% | 135.1 KiB/s | 354.3 KiB | 00m03s Warning: skipped OpenPGP checks for 3 packages from repository: copr_base Complete! Finish: installing minimal buildroot with dnf5 Start: creating root cache Finish: creating root cache Finish: chroot init INFO: Installed packages: INFO: add-determinism-0.6.0-1.fc43.x86_64 alternatives-1.33-1.fc43.x86_64 ansible-srpm-macros-1-17.1.fc42.noarch audit-libs-4.1.0-1.fc43.x86_64 bash-5.3.0-1.fc43.x86_64 binutils-2.44.90-2.fc43.x86_64 build-reproducibility-srpm-macros-0.6.0-1.fc43.noarch bzip2-1.0.8-20.fc42.x86_64 bzip2-libs-1.0.8-20.fc42.x86_64 ca-certificates-2024.2.69_v8.0.401-5.fc42.noarch coreutils-9.7-4.fc43.x86_64 coreutils-common-9.7-4.fc43.x86_64 cpio-2.15-2.fc41.x86_64 crypto-policies-20250714-1.gitcd6043a.fc43.noarch curl-8.15.0-1.fc43.x86_64 cyrus-sasl-lib-2.1.28-30.fc42.x86_64 debugedit-5.2-1.fc43.x86_64 diffutils-3.12-2.fc43.x86_64 dwz-0.16-1.fc43.x86_64 ed-1.21.1-1.fc43.x86_64 efi-srpm-macros-6-3.fc43.noarch elfutils-0.193-2.fc43.x86_64 elfutils-debuginfod-client-0.193-2.fc43.x86_64 elfutils-default-yama-scope-0.193-2.fc43.noarch elfutils-libelf-0.193-2.fc43.x86_64 elfutils-libs-0.193-2.fc43.x86_64 fedora-gpg-keys-43-0.2.noarch fedora-release-43-0.19.noarch fedora-release-common-43-0.19.noarch fedora-release-identity-basic-43-0.19.noarch fedora-repos-43-0.2.noarch fedora-repos-rawhide-43-0.2.noarch file-5.46-5.fc43.x86_64 file-libs-5.46-5.fc43.x86_64 filesystem-3.18-44.fc43.x86_64 filesystem-srpm-macros-3.18-44.fc43.noarch findutils-4.10.0-5.fc42.x86_64 fonts-srpm-macros-2.0.5-22.fc43.noarch forge-srpm-macros-0.4.0-2.fc42.noarch fpc-srpm-macros-1.3-14.fc42.noarch gawk-5.3.2-1.fc43.x86_64 gdb-minimal-16.3-3.fc43.x86_64 gdbm-libs-1.23-9.fc42.x86_64 ghc-srpm-macros-1.9.2-2.fc42.noarch glibc-2.41.9000-23.fc43.x86_64 glibc-common-2.41.9000-23.fc43.x86_64 glibc-gconv-extra-2.41.9000-23.fc43.x86_64 glibc-minimal-langpack-2.41.9000-23.fc43.x86_64 gmp-6.3.0-3.fc43.x86_64 gnat-srpm-macros-6-7.fc42.noarch gnupg2-2.4.8-2.fc43.x86_64 gnupg2-dirmngr-2.4.8-2.fc43.x86_64 gnupg2-gpg-agent-2.4.8-2.fc43.x86_64 gnupg2-gpgconf-2.4.8-2.fc43.x86_64 gnupg2-keyboxd-2.4.8-2.fc43.x86_64 gnupg2-verify-2.4.8-2.fc43.x86_64 gnutls-3.8.10-1.fc43.x86_64 go-srpm-macros-3.7.0-1.fc43.noarch gpg-pubkey-36f612dcf27f7d1a48a835e4dbfcf71c6d9f90a6-6786af3b gpg-pubkey-b0f4950458f69e1150c6c5edc8ac4916105ef944-65ca83d1 gpg-pubkey-c6e7f081cf80e13146676e88829b606631645531-66b6dccf gpgverify-2.2-2.fc43.noarch grep-3.12-1.fc43.x86_64 gzip-1.13-3.fc42.x86_64 ima-evm-utils-libs-1.6.2-5.fc43.x86_64 info-7.2-4.fc43.x86_64 jansson-2.14-2.fc42.x86_64 java-srpm-macros-1-6.fc43.noarch json-c-0.18-4.fc43.x86_64 kernel-srpm-macros-1.0-25.fc42.noarch keyutils-libs-1.6.3-5.fc42.x86_64 krb5-libs-1.21.3-6.fc43.x86_64 libacl-2.3.2-3.fc42.x86_64 libarchive-3.8.1-1.fc43.x86_64 libassuan-2.5.7-3.fc42.x86_64 libattr-2.5.2-5.fc42.x86_64 libblkid-2.41.1-11.fc43.x86_64 libbrotli-1.1.0-7.fc43.x86_64 libcap-2.76-1.fc43.x86_64 libcap-ng-0.8.5-5.fc43.x86_64 libcom_err-1.47.3-1.fc43.x86_64 libcurl-8.15.0-1.fc43.x86_64 libeconf-0.7.9-1.fc43.x86_64 libevent-2.1.12-15.fc42.x86_64 libfdisk-2.41.1-11.fc43.x86_64 libffi-3.5.1-1.fc43.x86_64 libfsverity-1.6-2.fc42.x86_64 libgcc-15.1.1-3.fc43.x86_64 libgcrypt-1.11.1-1.fc43.x86_64 libgomp-15.1.1-3.fc43.x86_64 libgpg-error-1.55-1.fc43.x86_64 libidn2-2.3.8-1.fc43.x86_64 libksba-1.6.7-3.fc42.x86_64 liblastlog2-2.41.1-11.fc43.x86_64 libmount-2.41.1-11.fc43.x86_64 libnghttp2-1.66.0-1.fc43.x86_64 libpkgconf-2.3.0-2.fc42.x86_64 libpsl-0.21.5-5.fc42.x86_64 libselinux-3.9-1.fc43.x86_64 libsemanage-3.9-1.fc43.x86_64 libsepol-3.9-1.fc43.x86_64 libsmartcols-2.41.1-11.fc43.x86_64 libssh-0.11.2-1.fc43.x86_64 libssh-config-0.11.2-1.fc43.noarch libstdc++-15.1.1-3.fc43.x86_64 libtasn1-4.20.0-1.fc43.x86_64 libtool-ltdl-2.5.4-5.fc43.x86_64 libunistring-1.1-9.fc42.x86_64 libusb1-1.0.28-2.fc43.x86_64 libuuid-2.41.1-11.fc43.x86_64 libverto-0.3.2-10.fc42.x86_64 libxcrypt-4.4.38-7.fc43.x86_64 libxml2-2.12.10-2.fc43.x86_64 libzstd-1.5.7-1.fc43.x86_64 lua-libs-5.4.8-1.fc43.x86_64 lua-srpm-macros-1-15.fc42.noarch lz4-libs-1.10.0-2.fc42.x86_64 mpfr-4.2.2-1.fc43.x86_64 ncurses-base-6.5-6.20250614.fc43.noarch ncurses-libs-6.5-6.20250614.fc43.x86_64 nettle-3.10.1-1.fc43.x86_64 npth-1.8-2.fc42.x86_64 ocaml-srpm-macros-10-4.fc42.noarch openblas-srpm-macros-2-19.fc42.noarch openldap-2.6.10-2.fc43.x86_64 openssl-libs-3.5.1-1.fc43.x86_64 p11-kit-0.25.5-8.fc43.x86_64 p11-kit-trust-0.25.5-8.fc43.x86_64 package-notes-srpm-macros-0.5-13.fc42.noarch pam-libs-1.7.1-2.fc43.x86_64 patch-2.8-1.fc43.x86_64 pcre2-10.45-1.fc43.x86_64 pcre2-syntax-10.45-1.fc43.noarch perl-srpm-macros-1-59.fc43.noarch pkgconf-2.3.0-2.fc42.x86_64 pkgconf-m4-2.3.0-2.fc42.noarch pkgconf-pkg-config-2.3.0-2.fc42.x86_64 popt-1.19-8.fc42.x86_64 publicsuffix-list-dafsa-20250616-1.fc43.noarch pyproject-srpm-macros-1.18.3-1.fc43.noarch python-srpm-macros-3.14-3.fc43.noarch qt5-srpm-macros-5.15.17-1.fc43.noarch qt6-srpm-macros-6.9.1-1.fc43.noarch readline-8.3-1.fc43.x86_64 redhat-rpm-config-343-7.fc43.noarch rpm-5.99.91-1.fc43.x86_64 rpm-build-5.99.91-1.fc43.x86_64 rpm-build-libs-5.99.91-1.fc43.x86_64 rpm-libs-5.99.91-1.fc43.x86_64 rpm-sequoia-1.9.0-1.fc43.x86_64 rpm-sign-libs-5.99.91-1.fc43.x86_64 rust-srpm-macros-26.3-4.fc42.noarch sed-4.9-4.fc42.x86_64 setup-2.15.0-25.fc43.noarch shadow-utils-4.18.0-1.fc43.x86_64 sqlite-libs-3.50.2-1.fc43.x86_64 systemd-libs-257.7-1.fc43.x86_64 systemd-standalone-sysusers-257.7-1.fc43.x86_64 tar-1.35-5.fc42.x86_64 tpm2-tss-4.1.3-7.fc43.x86_64 tree-sitter-srpm-macros-0.4.1-1.fc43.noarch unzip-6.0-66.fc42.x86_64 util-linux-2.41.1-11.fc43.x86_64 util-linux-core-2.41.1-11.fc43.x86_64 which-2.23-2.fc43.x86_64 xxhash-libs-0.8.3-2.fc42.x86_64 xz-5.8.1-1.fc43.x86_64 xz-libs-5.8.1-1.fc43.x86_64 zig-srpm-macros-1-4.fc42.noarch zip-3.0-43.fc42.x86_64 zlib-ng-compat-2.2.4-2.fc43.x86_64 zstd-1.5.7-1.fc43.x86_64 Start: buildsrpm Start: rpmbuild -bs Building target platforms: x86_64 Building for target x86_64 setting SOURCE_DATE_EPOCH=1753142400 Wrote: /builddir/build/SRPMS/rccl-6.4.2-1.fc43.src.rpm Finish: rpmbuild -bs INFO: chroot_scan: 1 files copied to /var/lib/copr-rpmbuild/results/chroot_scan INFO: /var/lib/mock/fedora-rawhide-x86_64-1753289447.166372/root/var/log/dnf5.log INFO: chroot_scan: creating tarball /var/lib/copr-rpmbuild/results/chroot_scan.tar.gz /bin/tar: Removing leading `/' from member names Finish: buildsrpm INFO: Done(/var/lib/copr-rpmbuild/workspace/workdir-q88lb_0o/rccl/rccl.spec) Config(child) 0 minutes 29 seconds INFO: Results and/or logs in: /var/lib/copr-rpmbuild/results INFO: Cleaning up build root ('cleanup_on_success=True') Start: clean chroot INFO: unmounting tmpfs. Finish: clean chroot INFO: Start(/var/lib/copr-rpmbuild/results/rccl-6.4.2-1.fc43.src.rpm) Config(fedora-rawhide-x86_64) Start(bootstrap): chroot init INFO: mounting tmpfs at /var/lib/mock/fedora-rawhide-x86_64-bootstrap-1753289447.166372/root. INFO: reusing tmpfs at /var/lib/mock/fedora-rawhide-x86_64-bootstrap-1753289447.166372/root. INFO: calling preinit hooks INFO: enabled root cache INFO: enabled package manager cache Start(bootstrap): cleaning package manager metadata Finish(bootstrap): cleaning package manager metadata Finish(bootstrap): chroot init Start: chroot init INFO: mounting tmpfs at /var/lib/mock/fedora-rawhide-x86_64-1753289447.166372/root. INFO: calling preinit hooks INFO: enabled root cache Start: unpacking root cache Finish: unpacking root cache INFO: enabled package manager cache Start: cleaning package manager metadata Finish: cleaning package manager metadata INFO: enabled HW Info plugin INFO: Buildroot is handled by package management downloaded with a bootstrap image: rpm-5.99.91-1.fc43.x86_64 rpm-sequoia-1.9.0-1.fc43.x86_64 dnf5-5.2.15.0-1.fc43.x86_64 dnf5-plugins-5.2.15.0-1.fc43.x86_64 Finish: chroot init Start: build phase for rccl-6.4.2-1.fc43.src.rpm Start: build setup for rccl-6.4.2-1.fc43.src.rpm Building target platforms: x86_64 Building for target x86_64 setting SOURCE_DATE_EPOCH=1753142400 Wrote: /builddir/build/SRPMS/rccl-6.4.2-1.fc43.src.rpm Updating and loading repositories: Copr repository 100% | 45.0 KiB/s | 1.5 KiB | 00m00s fedora 100% | 379.1 KiB/s | 24.3 KiB | 00m00s Repositories loaded. Package Arch Version Repository Size Installing: cmake x86_64 3.31.6-3.fc43 fedora 34.5 MiB gcc-c++ x86_64 15.1.1-3.fc43 copr_base 41.3 MiB hipify x86_64 6.4.1-2.fc43 copr_base 3.1 MiB rocm-cmake noarch 6.4.0-1.fc43 copr_base 130.5 KiB rocm-comgr-devel x86_64 19-12.rocm6.4.2.fc43 copr_base 98.2 KiB rocm-core-devel x86_64 6.4.2-1.fc43 copr_base 14.8 KiB rocm-hip-devel x86_64 6.4.2-1.fc43 copr_base 2.8 MiB rocm-rpm-macros noarch 6.4.0-4.fc43 fedora 18.9 KiB rocm-runtime-devel x86_64 6.4.2-1.fc43 copr_base 571.4 KiB rocm-smi-devel x86_64 6.4.2-1.fc43 copr_base 281.8 KiB Installing dependencies: annobin-docs noarch 12.98-1.fc43 fedora 98.9 KiB annobin-plugin-gcc x86_64 12.98-1.fc43 fedora 1.0 MiB cmake-data noarch 3.31.6-3.fc43 fedora 8.5 MiB cmake-filesystem x86_64 3.31.6-3.fc43 fedora 0.0 B cmake-rpm-macros noarch 3.31.6-3.fc43 fedora 7.7 KiB cpp x86_64 15.1.1-3.fc43 copr_base 37.9 MiB emacs-filesystem noarch 1:30.0-4.fc42 fedora 0.0 B environment-modules x86_64 5.5.0-3.fc42 fedora 1.8 MiB expat x86_64 2.7.1-1.fc43 fedora 294.2 KiB gcc x86_64 15.1.1-3.fc43 copr_base 111.2 MiB gcc-plugin-annobin x86_64 15.1.1-3.fc43 copr_base 57.2 KiB git x86_64 2.50.1-1.fc43 fedora 85.1 KiB git-core x86_64 2.50.1-1.fc43 fedora 23.5 MiB git-core-doc noarch 2.50.1-1.fc43 fedora 17.7 MiB glibc-devel x86_64 2.41.9000-23.fc43 fedora 2.3 MiB groff-base x86_64 1.23.0-8.fc42 fedora 3.9 MiB hipcc x86_64 19-12.rocm6.4.2.fc43 copr_base 653.0 KiB hwdata noarch 0.397-1.fc43 fedora 9.6 MiB jsoncpp x86_64 1.9.6-1.fc43 fedora 261.6 KiB kernel-headers x86_64 6.16.0-0.rc7.58.fc43 fedora 6.7 MiB less x86_64 679-1.fc43 fedora 406.1 KiB libcbor x86_64 0.12.0-5.fc43 fedora 77.8 KiB libdb x86_64 5.3.28-65.fc43 fedora 1.9 MiB libdrm x86_64 2.4.125-1.fc43 fedora 395.8 KiB libdrm-devel x86_64 2.4.125-1.fc43 fedora 728.8 KiB libedit x86_64 3.1-55.20250104cvs.fc42 fedora 244.1 KiB libfido2 x86_64 1.16.0-2.fc43 fedora 238.5 KiB libmpc x86_64 1.3.1-7.fc42 fedora 164.5 KiB libpciaccess x86_64 0.16-15.fc42 fedora 44.5 KiB libpciaccess-devel x86_64 0.16-15.fc42 fedora 15.3 KiB libpipeline x86_64 1.5.8-2.fc42 fedora 145.1 KiB libstdc++-devel x86_64 15.1.1-3.fc43 copr_base 16.1 MiB libtommath x86_64 1.3.1~rc1-5.fc42 fedora 130.4 KiB libuv x86_64 1:1.51.0-1.fc43 fedora 570.2 KiB libxcrypt-devel x86_64 4.4.38-7.fc43 fedora 30.8 KiB make x86_64 1:4.4.1-10.fc42 fedora 1.8 MiB man-db x86_64 2.13.1-1.fc43 fedora 2.9 MiB mpdecimal x86_64 4.0.1-1.fc43 fedora 217.2 KiB ncurses x86_64 6.5-6.20250614.fc43 fedora 609.8 KiB numactl-libs x86_64 2.0.19-2.fc42 fedora 52.9 KiB openssh x86_64 10.0p1-4.fc43 fedora 1.4 MiB openssh-clients x86_64 10.0p1-4.fc43 fedora 2.6 MiB perl x86_64 4:5.42.0-519.fc43 fedora 0.0 B perl-Algorithm-Diff noarch 1.2010-13.fc42 fedora 107.5 KiB perl-Archive-Tar noarch 3.04-520.fc43 fedora 154.4 KiB perl-Archive-Zip noarch 1.68-16.fc42 fedora 291.1 KiB perl-Attribute-Handlers noarch 1.03-519.fc43 fedora 39.9 KiB perl-AutoLoader noarch 5.74-519.fc43 fedora 20.6 KiB perl-AutoSplit noarch 5.74-519.fc43 fedora 23.1 KiB perl-B x86_64 1.89-519.fc43 fedora 501.3 KiB perl-Benchmark noarch 1.27-519.fc43 fedora 36.4 KiB perl-CPAN noarch 2.38-520.fc43 fedora 1.9 MiB perl-CPAN-Meta noarch 2.150010-519.fc43 fedora 592.2 KiB perl-CPAN-Meta-Requirements noarch 2.143-12.fc43 fedora 81.2 KiB perl-CPAN-Meta-YAML noarch 0.020-520.fc43 fedora 52.1 KiB perl-Carp noarch 1.54-519.fc43 fedora 46.6 KiB perl-Class-Struct noarch 0.68-519.fc43 fedora 25.4 KiB perl-Compress-Bzip2 x86_64 2.28-23.fc43 fedora 142.6 KiB perl-Compress-Raw-Bzip2 x86_64 2.213-520.fc43 fedora 67.3 KiB perl-Compress-Raw-Lzma x86_64 2.213-6.fc43 fedora 120.9 KiB perl-Compress-Raw-Zlib x86_64 2.213-520.fc43 fedora 163.2 KiB perl-Config-Extensions noarch 0.03-519.fc43 fedora 2.7 KiB perl-Config-Perl-V noarch 0.38-520.fc43 fedora 25.9 KiB perl-DBM_Filter noarch 0.07-519.fc43 fedora 28.7 KiB perl-DB_File x86_64 1.859-515.fc43 fedora 188.8 KiB perl-Data-Dumper x86_64 2.191-520.fc43 fedora 115.6 KiB perl-Data-OptList noarch 0.114-6.fc42 fedora 50.1 KiB perl-Data-Section noarch 0.200008-7.fc42 fedora 42.7 KiB perl-Devel-PPPort x86_64 3.73-520.fc43 fedora 889.8 KiB perl-Devel-Peek x86_64 1.36-519.fc43 fedora 43.5 KiB perl-Devel-SelfStubber noarch 1.06-519.fc43 fedora 6.8 KiB perl-Devel-Size x86_64 0.85-2.fc43 fedora 42.0 KiB perl-Digest noarch 1.20-519.fc43 fedora 35.3 KiB perl-Digest-MD5 x86_64 2.59-519.fc43 fedora 59.7 KiB perl-Digest-SHA x86_64 1:6.04-520.fc43 fedora 112.5 KiB perl-DirHandle noarch 1.05-519.fc43 fedora 3.4 KiB perl-Dumpvalue noarch 2.27-519.fc43 fedora 19.8 KiB perl-DynaLoader x86_64 1.57-519.fc43 fedora 32.1 KiB perl-Encode x86_64 4:3.21-519.fc43 fedora 4.7 MiB perl-Encode-devel x86_64 4:3.21-519.fc43 fedora 99.6 KiB perl-English noarch 1.11-519.fc43 fedora 6.2 KiB perl-Env noarch 1.06-519.fc43 fedora 26.1 KiB perl-Errno x86_64 1.38-519.fc43 fedora 8.4 KiB perl-Error noarch 1:0.17030-1.fc43 fedora 76.7 KiB perl-Exporter noarch 5.79-519.fc43 fedora 54.3 KiB perl-ExtUtils-CBuilder noarch 1:0.280242-519.fc43 fedora 97.3 KiB perl-ExtUtils-Command noarch 2:7.76-520.fc43 fedora 9.6 KiB perl-ExtUtils-Constant noarch 0.25-519.fc43 fedora 85.9 KiB perl-ExtUtils-Embed noarch 1.35-519.fc43 fedora 15.6 KiB perl-ExtUtils-Install noarch 2.22-519.fc43 fedora 85.5 KiB perl-ExtUtils-MM-Utils noarch 2:7.76-520.fc43 fedora 2.9 KiB perl-ExtUtils-MakeMaker noarch 2:7.76-520.fc43 fedora 739.7 KiB perl-ExtUtils-Manifest noarch 1:1.75-519.fc43 fedora 84.8 KiB perl-ExtUtils-Miniperl noarch 1.14-519.fc43 fedora 8.3 KiB perl-ExtUtils-ParseXS noarch 1:3.58-1.fc43 fedora 539.6 KiB perl-Fcntl x86_64 1.20-519.fc43 fedora 48.8 KiB perl-File-Basename noarch 2.86-519.fc43 fedora 14.0 KiB perl-File-Compare noarch 1.100.800-519.fc43 fedora 5.6 KiB perl-File-Copy noarch 2.41-519.fc43 fedora 19.7 KiB perl-File-DosGlob x86_64 1.12-519.fc43 fedora 20.8 KiB perl-File-Fetch noarch 1.08-2.fc43 fedora 60.3 KiB perl-File-Find noarch 1.44-519.fc43 fedora 42.0 KiB perl-File-HomeDir noarch 1.006-14.fc42 fedora 119.3 KiB perl-File-Path noarch 2.18-519.fc43 fedora 63.5 KiB perl-File-Temp noarch 1:0.231.100-519.fc43 fedora 162.3 KiB perl-File-Which noarch 1.27-13.fc42 fedora 30.4 KiB perl-File-stat noarch 1.14-519.fc43 fedora 12.5 KiB perl-FileCache noarch 1.10-519.fc43 fedora 7.5 KiB perl-FileHandle noarch 2.05-519.fc43 fedora 9.4 KiB perl-Filter x86_64 2:1.64-520.fc43 fedora 156.7 KiB perl-Filter-Simple noarch 0.96-519.fc43 fedora 50.7 KiB perl-FindBin noarch 1.54-519.fc43 fedora 6.8 KiB perl-GDBM_File x86_64 1:1.24-519.fc43 fedora 79.6 KiB perl-Getopt-Long noarch 1:2.58-519.fc43 fedora 144.5 KiB perl-Getopt-Std noarch 1.14-519.fc43 fedora 11.2 KiB perl-Git noarch 2.50.1-1.fc43 fedora 64.0 KiB perl-HTTP-Tiny noarch 0.090-520.fc43 fedora 154.4 KiB perl-Hash-Util x86_64 0.32-519.fc43 fedora 55.0 KiB perl-Hash-Util-FieldHash x86_64 1.27-519.fc43 fedora 62.6 KiB perl-I18N-Collate noarch 1.02-519.fc43 fedora 7.1 KiB perl-I18N-LangTags noarch 0.45-519.fc43 fedora 82.4 KiB perl-I18N-Langinfo x86_64 0.24-519.fc43 fedora 34.7 KiB perl-IO x86_64 1.55-519.fc43 fedora 147.4 KiB perl-IO-Compress noarch 2.213-520.fc43 fedora 1.0 MiB perl-IO-Compress-Lzma noarch 2.213-2.fc42 fedora 215.2 KiB perl-IO-Socket-IP noarch 0.43-520.fc43 fedora 100.3 KiB perl-IO-Socket-SSL noarch 2.095-1.fc43 fedora 714.5 KiB perl-IO-Zlib noarch 1:1.15-519.fc43 fedora 25.8 KiB perl-IPC-Cmd noarch 2:1.04-520.fc43 fedora 84.9 KiB perl-IPC-Open3 noarch 1.24-519.fc43 fedora 27.7 KiB perl-IPC-SysV x86_64 2.09-520.fc43 fedora 73.7 KiB perl-IPC-System-Simple noarch 1.30-15.fc42 fedora 71.7 KiB perl-JSON-PP noarch 1:4.16-520.fc43 fedora 141.8 KiB perl-Locale-Maketext noarch 1.33-520.fc43 fedora 171.3 KiB perl-Locale-Maketext-Simple noarch 1:0.21-519.fc43 fedora 12.8 KiB perl-MIME-Base32 noarch 1.303-23.fc42 fedora 30.7 KiB perl-MIME-Base64 x86_64 3.16-519.fc43 fedora 42.0 KiB perl-MRO-Compat noarch 0.15-11.fc42 fedora 43.0 KiB perl-Math-BigInt noarch 1:2.0050.03-2.fc43 fedora 1.1 MiB perl-Math-BigInt-FastCalc x86_64 0.502.000-519.fc43 fedora 44.0 KiB perl-Math-Complex noarch 1.63-519.fc43 fedora 85.1 KiB perl-Memoize noarch 1.17-519.fc43 fedora 64.7 KiB perl-Module-Build noarch 2:0.42.34-8.fc42 fedora 654.2 KiB perl-Module-CoreList noarch 1:5.20250720-1.fc43 fedora 1.2 MiB perl-Module-CoreList-tools noarch 1:5.20250720-1.fc43 fedora 18.6 KiB perl-Module-Load noarch 1:0.36-519.fc43 fedora 14.9 KiB perl-Module-Load-Conditional noarch 0.74-519.fc43 fedora 28.7 KiB perl-Module-Loaded noarch 1:0.08-519.fc43 fedora 5.0 KiB perl-Module-Metadata noarch 1.000038-519.fc43 fedora 67.5 KiB perl-Module-Signature noarch 0.93-1.fc43 fedora 136.5 KiB perl-NDBM_File x86_64 1.18-519.fc43 fedora 28.5 KiB perl-NEXT noarch 0.69-519.fc43 fedora 23.6 KiB perl-Net noarch 1.04-519.fc43 fedora 22.4 KiB perl-Net-Ping noarch 2.76-519.fc43 fedora 134.2 KiB perl-Net-SSLeay x86_64 1.94-10.fc43 fedora 1.3 MiB perl-ODBM_File x86_64 1.20-519.fc43 fedora 28.5 KiB perl-Opcode x86_64 1.69-519.fc43 fedora 48.6 KiB perl-POSIX x86_64 2.23-519.fc43 fedora 231.4 KiB perl-Package-Generator noarch 1.106-33.fc42 fedora 29.9 KiB perl-Params-Check noarch 1:0.38-519.fc43 fedora 27.6 KiB perl-Params-Util x86_64 1.102-18.fc43 fedora 58.5 KiB perl-PathTools x86_64 3.94-519.fc43 fedora 180.0 KiB perl-Perl-OSType noarch 1.010-520.fc43 fedora 32.8 KiB perl-PerlIO-via-QuotedPrint noarch 0.10-519.fc43 fedora 30.2 KiB perl-Pod-Checker noarch 4:1.77-519.fc43 fedora 52.2 KiB perl-Pod-Escapes noarch 1:1.07-519.fc43 fedora 24.9 KiB perl-Pod-Functions noarch 1.14-519.fc43 fedora 14.4 KiB perl-Pod-Html noarch 1.35-519.fc43 fedora 42.3 KiB perl-Pod-Perldoc noarch 3.28.01-520.fc43 fedora 163.7 KiB perl-Pod-Simple noarch 1:3.47-2.fc43 fedora 565.2 KiB perl-Pod-Usage noarch 4:2.05-519.fc43 fedora 86.3 KiB perl-Safe noarch 2.47-519.fc43 fedora 30.7 KiB perl-Scalar-List-Utils x86_64 5:1.69-519.fc43 fedora 144.8 KiB perl-Search-Dict noarch 1.08-519.fc43 fedora 4.7 KiB perl-SelectSaver noarch 1.02-519.fc43 fedora 2.2 KiB perl-SelfLoader noarch 1.28-519.fc43 fedora 22.2 KiB perl-Socket x86_64 4:2.040-1.fc43 fedora 120.3 KiB perl-Software-License noarch 0.104007-1.fc43 fedora 500.7 KiB perl-Storable x86_64 1:3.37-520.fc43 fedora 231.2 KiB perl-Sub-Exporter noarch 0.991-5.fc42 fedora 194.9 KiB perl-Sub-Install noarch 0.929-7.fc42 fedora 35.9 KiB perl-Symbol noarch 1.09-519.fc43 fedora 6.8 KiB perl-Sys-Hostname x86_64 1.25-519.fc43 fedora 15.8 KiB perl-Sys-Syslog x86_64 0.36-520.fc43 fedora 94.7 KiB perl-Term-ANSIColor noarch 5.01-520.fc43 fedora 97.5 KiB perl-Term-Cap noarch 1.18-519.fc43 fedora 29.3 KiB perl-Term-Complete noarch 1.403-519.fc43 fedora 5.8 KiB perl-Term-ReadLine noarch 1.17-519.fc43 fedora 17.3 KiB perl-Term-Table noarch 0.024-519.fc43 fedora 77.8 KiB perl-TermReadKey x86_64 2.38-25.fc43 fedora 64.0 KiB perl-Test noarch 1.31-519.fc43 fedora 37.0 KiB perl-Test-Harness noarch 1:3.52-3.fc43 fedora 560.8 KiB perl-Test-Simple noarch 3:1.302214-3.fc43 fedora 1.7 MiB perl-Text-Abbrev noarch 1.02-519.fc43 fedora 3.1 KiB perl-Text-Balanced noarch 2.06-519.fc43 fedora 111.4 KiB perl-Text-Diff noarch 1.45-23.fc42 fedora 83.0 KiB perl-Text-Glob noarch 0.11-25.fc42 fedora 8.4 KiB perl-Text-ParseWords noarch 3.31-519.fc43 fedora 13.6 KiB perl-Text-Tabs+Wrap noarch 2024.001-519.fc43 fedora 22.6 KiB perl-Text-Template noarch 1.61-7.fc42 fedora 112.4 KiB perl-Thread noarch 3.06-519.fc43 fedora 12.1 KiB perl-Thread-Queue noarch 3.14-519.fc43 fedora 28.9 KiB perl-Thread-Semaphore noarch 2.13-519.fc43 fedora 10.0 KiB perl-Tie noarch 4.6-519.fc43 fedora 32.1 KiB perl-Tie-File noarch 1.10-519.fc43 fedora 85.6 KiB perl-Tie-Memoize noarch 1.1-519.fc43 fedora 6.2 KiB perl-Tie-RefHash noarch 1.41-519.fc43 fedora 35.9 KiB perl-Time noarch 1.04-519.fc43 fedora 9.8 KiB perl-Time-HiRes x86_64 4:1.9778-519.fc43 fedora 115.8 KiB perl-Time-Local noarch 2:1.350-519.fc43 fedora 68.9 KiB perl-Time-Piece x86_64 1.3600-519.fc43 fedora 71.2 KiB perl-URI noarch 5.32-1.fc43 fedora 261.2 KiB perl-Unicode-Collate x86_64 1.31-519.fc43 fedora 4.2 MiB perl-Unicode-Normalize x86_64 1.32-519.fc43 fedora 486.1 KiB perl-Unicode-UCD noarch 0.81-519.fc43 fedora 206.4 KiB perl-User-pwent noarch 1.05-519.fc43 fedora 17.1 KiB perl-autodie noarch 2.37-520.fc43 fedora 214.9 KiB perl-autouse noarch 1.11-519.fc43 fedora 5.9 KiB perl-base noarch 2.27-519.fc43 fedora 12.6 KiB perl-bignum noarch 0.67-520.fc43 fedora 133.1 KiB perl-blib noarch 1.07-519.fc43 fedora 3.2 KiB perl-constant noarch 1.33-520.fc43 fedora 26.2 KiB perl-debugger noarch 1.60-519.fc43 fedora 403.2 KiB perl-deprecate noarch 0.04-519.fc43 fedora 6.6 KiB perl-devel x86_64 4:5.42.0-519.fc43 fedora 3.8 MiB perl-diagnostics noarch 1.40-519.fc43 fedora 471.0 KiB perl-doc noarch 5.42.0-519.fc43 fedora 11.5 MiB perl-encoding x86_64 4:3.00-519.fc43 fedora 149.4 KiB perl-encoding-warnings noarch 0.14-519.fc43 fedora 10.1 KiB perl-experimental noarch 0.036-1.fc43 fedora 43.4 KiB perl-fields noarch 2.27-519.fc43 fedora 11.9 KiB perl-filetest noarch 1.03-519.fc43 fedora 6.4 KiB perl-if noarch 0.61.000-519.fc43 fedora 5.8 KiB perl-inc-latest noarch 2:0.500-30.fc42 fedora 34.6 KiB perl-interpreter x86_64 4:5.42.0-519.fc43 fedora 118.6 KiB perl-less noarch 0.03-519.fc43 fedora 4.9 KiB perl-lib x86_64 0.65-519.fc43 fedora 8.5 KiB perl-libnet noarch 3.15-520.fc43 fedora 289.4 KiB perl-libnetcfg noarch 4:5.42.0-519.fc43 fedora 16.9 KiB perl-libs x86_64 4:5.42.0-519.fc43 fedora 11.5 MiB perl-local-lib noarch 2.000029-9.fc42 fedora 117.6 KiB perl-locale noarch 1.13-519.fc43 fedora 6.1 KiB perl-macros noarch 4:5.42.0-519.fc43 fedora 5.5 KiB perl-meta-notation noarch 5.42.0-519.fc43 fedora 2.0 KiB perl-mro x86_64 1.29-519.fc43 fedora 41.6 KiB perl-open noarch 1.13-519.fc43 fedora 11.3 KiB perl-overload noarch 1.40-519.fc43 fedora 71.6 KiB perl-overloading noarch 0.02-519.fc43 fedora 4.9 KiB perl-parent noarch 1:0.244-519.fc43 fedora 10.3 KiB perl-perlfaq noarch 5.20250619-519.fc43 fedora 733.6 KiB perl-ph x86_64 5.42.0-519.fc43 fedora 276.4 KiB perl-podlators noarch 1:6.0.2-519.fc43 fedora 317.4 KiB perl-sigtrap noarch 1.10-519.fc43 fedora 11.1 KiB perl-sort noarch 2.06-519.fc43 fedora 4.8 KiB perl-subs noarch 1.04-519.fc43 fedora 2.1 KiB perl-threads x86_64 1:2.43-519.fc43 fedora 115.1 KiB perl-threads-shared x86_64 1.70-519.fc43 fedora 83.6 KiB perl-utils noarch 5.42.0-519.fc43 fedora 97.0 KiB perl-vars noarch 1.05-519.fc43 fedora 3.9 KiB perl-version x86_64 9:0.99.33-520.fc43 fedora 128.7 KiB perl-vmsish noarch 1.04-519.fc43 fedora 6.6 KiB procps-ng x86_64 4.0.4-6.fc42 fedora 1.0 MiB python-pip-wheel noarch 25.1.1-13.fc43 fedora 1.2 MiB python3 x86_64 3.14.0~b4-1.fc43 fedora 28.9 KiB python3-libs x86_64 3.14.0~b4-1.fc43 fedora 42.9 MiB python3-pyparsing noarch 3.1.2-11.fc43 fedora 1.0 MiB rhash x86_64 1.4.5-2.fc42 fedora 351.0 KiB rocm-clang x86_64 19-12.rocm6.4.2.fc43 copr_base 70.2 MiB rocm-clang-devel x86_64 19-12.rocm6.4.2.fc43 copr_base 23.3 MiB rocm-clang-libs x86_64 19-12.rocm6.4.2.fc43 copr_base 98.4 MiB rocm-clang-runtime-devel x86_64 19-12.rocm6.4.2.fc43 copr_base 6.9 MiB rocm-comgr x86_64 19-12.rocm6.4.2.fc43 copr_base 123.9 MiB rocm-core x86_64 6.4.2-1.fc43 copr_base 12.3 KiB rocm-device-libs x86_64 19-12.rocm6.4.2.fc43 copr_base 3.2 MiB rocm-hip x86_64 6.4.2-1.fc43 copr_base 24.9 MiB rocm-libc++ x86_64 19-12.rocm6.4.2.fc43 copr_base 1.2 MiB rocm-libc++-devel x86_64 19-12.rocm6.4.2.fc43 copr_base 7.5 MiB rocm-lld x86_64 19-12.rocm6.4.2.fc43 copr_base 5.7 MiB rocm-llvm x86_64 19-12.rocm6.4.2.fc43 copr_base 48.5 MiB rocm-llvm-devel x86_64 19-12.rocm6.4.2.fc43 copr_base 25.3 MiB rocm-llvm-filesystem x86_64 19-12.rocm6.4.2.fc43 copr_base 0.0 B rocm-llvm-libs x86_64 19-12.rocm6.4.2.fc43 copr_base 84.8 MiB rocm-llvm-static x86_64 19-12.rocm6.4.2.fc43 copr_base 250.3 MiB rocm-runtime x86_64 6.4.2-1.fc43 copr_base 3.1 MiB rocm-smi x86_64 6.4.2-1.fc43 copr_base 2.7 MiB systemtap-sdt-devel x86_64 5.3-2.fc43 fedora 182.9 KiB systemtap-sdt-dtrace x86_64 5.3-2.fc43 fedora 179.6 KiB tcl x86_64 1:9.0.2-1.fc43 fedora 4.3 MiB tzdata noarch 2025b-1.fc43 fedora 1.6 MiB vim-filesystem noarch 2:9.1.1537-2.fc43 fedora 40.0 B zlib-ng-compat-devel x86_64 2.2.4-2.fc43 fedora 107.0 KiB Transaction Summary: Installing: 301 packages Total size of inbound packages is 295 MiB. Need to download 295 MiB. After this operation, 1 GiB extra will be used (install 1 GiB, remove 0 B). [ 1/301] hipify-0:6.4.1-2.fc43.x86_64 100% | 3.3 MiB/s | 505.5 KiB | 00m00s [ 2/301] gcc-c++-0:15.1.1-3.fc43.x86_6 100% | 63.0 MiB/s | 15.2 MiB | 00m00s [ 3/301] rocm-cmake-0:6.4.0-1.fc43.noa 100% | 399.6 KiB/s | 37.6 KiB | 00m00s [ 4/301] rocm-comgr-devel-0:19-12.rocm 100% | 2.6 MiB/s | 32.1 KiB | 00m00s [ 5/301] rocm-core-devel-0:6.4.2-1.fc4 100% | 448.7 KiB/s | 13.5 KiB | 00m00s [ 6/301] rocm-hip-devel-0:6.4.2-1.fc43 100% | 5.3 MiB/s | 233.6 KiB | 00m00s [ 7/301] rocm-runtime-devel-0:6.4.2-1. 100% | 5.4 MiB/s | 93.8 KiB | 00m00s [ 8/301] rocm-smi-devel-0:6.4.2-1.fc43 100% | 1.3 MiB/s | 57.3 KiB | 00m00s [ 9/301] rocm-rpm-macros-0:6.4.0-4.fc4 100% | 17.8 KiB/s | 15.9 KiB | 00m01s [ 10/301] cmake-filesystem-0:3.31.6-3.f 100% | 15.8 KiB/s | 16.4 KiB | 00m01s [ 11/301] expat-0:2.7.1-1.fc43.x86_64 100% | 266.5 KiB/s | 115.9 KiB | 00m00s [ 12/301] cmake-0:3.31.6-3.fc43.x86_64 100% | 4.2 MiB/s | 12.2 MiB | 00m03s [ 13/301] cmake-data-0:3.31.6-3.fc43.no 100% | 917.8 KiB/s | 2.5 MiB | 00m03s [ 14/301] jsoncpp-0:1.9.6-1.fc43.x86_64 100% | 100.4 KiB/s | 101.6 KiB | 00m01s [ 15/301] libuv-1:1.51.0-1.fc43.x86_64 100% | 376.2 KiB/s | 266.4 KiB | 00m01s [ 16/301] make-1:4.4.1-10.fc42.x86_64 100% | 1.0 MiB/s | 587.0 KiB | 00m01s [ 17/301] rhash-0:1.4.5-2.fc42.x86_64 100% | 883.1 KiB/s | 198.7 KiB | 00m00s [ 18/301] libstdc++-devel-0:15.1.1-3.fc 100% | 12.6 MiB/s | 2.7 MiB | 00m00s [ 19/301] perl-4:5.42.0-519.fc43.x86_64 100% | 78.0 KiB/s | 13.9 KiB | 00m00s [ 20/301] gcc-0:15.1.1-3.fc43.x86_64 100% | 76.3 MiB/s | 39.4 MiB | 00m01s [ 21/301] libmpc-0:1.3.1-7.fc42.x86_64 100% | 242.8 KiB/s | 70.9 KiB | 00m00s [ 22/301] perl-interpreter-4:5.42.0-519 100% | 288.3 KiB/s | 72.6 KiB | 00m00s [ 23/301] perl-File-Basename-0:2.86-519 100% | 317.2 KiB/s | 17.4 KiB | 00m00s [ 24/301] perl-File-Copy-0:2.41-519.fc4 100% | 118.6 KiB/s | 20.4 KiB | 00m00s [ 25/301] rocm-hip-0:6.4.2-1.fc43.x86_6 100% | 22.2 MiB/s | 9.5 MiB | 00m00s [ 26/301] rocm-comgr-0:19-12.rocm6.4.2. 100% | 63.6 MiB/s | 30.5 MiB | 00m00s [ 27/301] perl-File-Which-0:1.27-13.fc4 100% | 218.3 KiB/s | 21.6 KiB | 00m00s [ 28/301] perl-Getopt-Std-0:1.14-519.fc 100% | 284.9 KiB/s | 16.0 KiB | 00m00s [ 29/301] perl-PathTools-0:3.94-519.fc4 100% | 1.2 MiB/s | 87.3 KiB | 00m00s [ 30/301] perl-Scalar-List-Utils-5:1.69 100% | 289.2 KiB/s | 74.6 KiB | 00m00s [ 31/301] perl-URI-0:5.32-1.fc43.noarch 100% | 565.0 KiB/s | 143.5 KiB | 00m00s [ 32/301] rocm-runtime-0:6.4.2-1.fc43.x 100% | 27.6 MiB/s | 650.7 KiB | 00m00s [ 33/301] emacs-filesystem-1:30.0-4.fc4 100% | 20.2 KiB/s | 7.4 KiB | 00m00s [ 34/301] vim-filesystem-2:9.1.1537-2.f 100% | 38.5 KiB/s | 15.2 KiB | 00m00s [ 35/301] environment-modules-0:5.5.0-3 100% | 1.1 MiB/s | 764.7 KiB | 00m01s [ 36/301] cpp-0:15.1.1-3.fc43.x86_64 100% | 75.0 MiB/s | 12.9 MiB | 00m00s [ 37/301] perl-Attribute-Handlers-0:1.0 100% | 49.9 KiB/s | 28.3 KiB | 00m01s [ 38/301] perl-AutoLoader-0:5.74-519.fc 100% | 39.5 KiB/s | 21.5 KiB | 00m01s [ 39/301] perl-Archive-Tar-0:3.04-520.f 100% | 64.7 KiB/s | 71.1 KiB | 00m01s [ 40/301] perl-AutoSplit-0:5.74-519.fc4 100% | 46.8 KiB/s | 21.9 KiB | 00m00s [ 41/301] perl-Benchmark-0:1.27-519.fc4 100% | 136.6 KiB/s | 27.1 KiB | 00m00s [ 42/301] perl-B-0:1.89-519.fc43.x86_64 100% | 254.5 KiB/s | 177.9 KiB | 00m01s [ 43/301] perl-CPAN-0:2.38-520.fc43.noa 100% | 1.1 MiB/s | 567.4 KiB | 00m00s [ 44/301] perl-CPAN-Meta-Requirements-0 100% | 130.2 KiB/s | 34.6 KiB | 00m00s [ 45/301] perl-CPAN-Meta-0:2.150010-519 100% | 454.7 KiB/s | 191.0 KiB | 00m00s [ 46/301] perl-CPAN-Meta-YAML-0:0.020-5 100% | 213.5 KiB/s | 26.9 KiB | 00m00s [ 47/301] perl-Carp-0:1.54-519.fc43.noa 100% | 268.7 KiB/s | 28.8 KiB | 00m00s [ 48/301] perl-Class-Struct-0:0.68-519. 100% | 240.2 KiB/s | 22.3 KiB | 00m00s [ 49/301] perl-Compress-Raw-Bzip2-0:2.2 100% | 354.3 KiB/s | 36.1 KiB | 00m00s [ 50/301] perl-Config-Extensions-0:0.03 100% | 113.9 KiB/s | 12.5 KiB | 00m00s [ 51/301] perl-Config-Perl-V-0:0.38-520 100% | 202.0 KiB/s | 21.8 KiB | 00m00s [ 52/301] perl-Compress-Raw-Zlib-0:2.21 100% | 296.1 KiB/s | 65.1 KiB | 00m00s [ 53/301] perl-DBM_Filter-0:0.07-519.fc 100% | 343.8 KiB/s | 27.5 KiB | 00m00s [ 54/301] perl-Data-Dumper-0:2.191-520. 100% | 364.3 KiB/s | 56.5 KiB | 00m00s [ 55/301] perl-DB_File-0:1.859-515.fc43 100% | 430.9 KiB/s | 81.0 KiB | 00m00s [ 56/301] perl-Devel-PPPort-0:3.73-520. 100% | 1.0 MiB/s | 220.1 KiB | 00m00s [ 57/301] perl-Devel-Peek-0:1.36-519.fc 100% | 318.7 KiB/s | 32.2 KiB | 00m00s [ 58/301] perl-Devel-SelfStubber-0:1.06 100% | 180.2 KiB/s | 14.6 KiB | 00m00s [ 59/301] perl-Digest-0:1.20-519.fc43.n 100% | 460.7 KiB/s | 24.9 KiB | 00m00s [ 60/301] perl-Digest-MD5-0:2.59-519.fc 100% | 570.2 KiB/s | 35.9 KiB | 00m00s [ 61/301] perl-Digest-SHA-1:6.04-520.fc 100% | 729.3 KiB/s | 62.0 KiB | 00m00s [ 62/301] perl-DirHandle-0:1.05-519.fc4 100% | 172.0 KiB/s | 12.7 KiB | 00m00s [ 63/301] perl-Dumpvalue-0:2.27-519.fc4 100% | 241.5 KiB/s | 18.6 KiB | 00m00s [ 64/301] perl-DynaLoader-0:1.57-519.fc 100% | 453.2 KiB/s | 26.3 KiB | 00m00s [ 65/301] perl-English-0:1.11-519.fc43. 100% | 104.3 KiB/s | 13.9 KiB | 00m00s [ 66/301] perl-Errno-0:1.38-519.fc43.x8 100% | 130.0 KiB/s | 15.2 KiB | 00m00s [ 67/301] perl-Env-0:1.06-519.fc43.noar 100% | 160.9 KiB/s | 19.5 KiB | 00m00s [ 68/301] perl-Exporter-0:5.79-519.fc43 100% | 157.9 KiB/s | 30.9 KiB | 00m00s [ 69/301] perl-ExtUtils-CBuilder-1:0.28 100% | 199.8 KiB/s | 50.7 KiB | 00m00s [ 70/301] perl-ExtUtils-Command-2:7.76- 100% | 55.5 KiB/s | 14.1 KiB | 00m00s [ 71/301] perl-ExtUtils-Constant-0:0.25 100% | 77.4 KiB/s | 44.1 KiB | 00m01s [ 72/301] perl-ExtUtils-Embed-0:1.35-51 100% | 35.0 KiB/s | 18.0 KiB | 00m01s [ 73/301] perl-ExtUtils-Install-0:2.22- 100% | 81.8 KiB/s | 43.4 KiB | 00m01s [ 74/301] perl-ExtUtils-MM-Utils-2:7.76 100% | 153.7 KiB/s | 11.7 KiB | 00m00s [ 75/301] perl-ExtUtils-Manifest-1:1.75 100% | 241.6 KiB/s | 34.1 KiB | 00m00s [ 76/301] perl-ExtUtils-Miniperl-0:1.14 100% | 159.3 KiB/s | 15.3 KiB | 00m00s [ 77/301] perl-ExtUtils-MakeMaker-2:7.7 100% | 1.2 MiB/s | 294.6 KiB | 00m00s [ 78/301] perl-Fcntl-0:1.20-519.fc43.x8 100% | 273.2 KiB/s | 30.1 KiB | 00m00s [ 79/301] perl-File-Compare-0:1.100.800 100% | 276.0 KiB/s | 13.5 KiB | 00m00s [ 80/301] perl-ExtUtils-ParseXS-1:3.58- 100% | 1.1 MiB/s | 220.6 KiB | 00m00s [ 81/301] perl-File-DosGlob-0:1.12-519. 100% | 275.9 KiB/s | 19.9 KiB | 00m00s [ 82/301] perl-File-Fetch-0:1.08-2.fc43 100% | 428.1 KiB/s | 30.8 KiB | 00m00s [ 83/301] perl-File-Find-0:1.44-519.fc4 100% | 777.2 KiB/s | 25.6 KiB | 00m00s [ 84/301] perl-File-Path-0:2.18-519.fc4 100% | 475.0 KiB/s | 35.2 KiB | 00m00s [ 85/301] perl-File-Temp-1:0.231.100-51 100% | 616.3 KiB/s | 59.2 KiB | 00m00s [ 86/301] perl-File-stat-0:1.14-519.fc4 100% | 219.3 KiB/s | 17.3 KiB | 00m00s [ 87/301] perl-FileCache-0:1.10-519.fc4 100% | 238.0 KiB/s | 15.0 KiB | 00m00s [ 88/301] perl-FileHandle-0:2.05-519.fc 100% | 321.9 KiB/s | 15.8 KiB | 00m00s [ 89/301] perl-Filter-Simple-0:0.96-519 100% | 328.7 KiB/s | 27.0 KiB | 00m00s [ 90/301] perl-FindBin-0:1.54-519.fc43. 100% | 237.7 KiB/s | 14.5 KiB | 00m00s [ 91/301] perl-Filter-2:1.64-520.fc43.x 100% | 683.3 KiB/s | 86.1 KiB | 00m00s [ 92/301] perl-GDBM_File-1:1.24-519.fc4 100% | 1.3 MiB/s | 42.7 KiB | 00m00s [ 93/301] perl-Getopt-Long-1:2.58-519.f 100% | 826.6 KiB/s | 63.6 KiB | 00m00s [ 94/301] perl-HTTP-Tiny-0:0.090-520.fc 100% | 724.5 KiB/s | 56.5 KiB | 00m00s [ 95/301] perl-Hash-Util-0:0.32-519.fc4 100% | 435.3 KiB/s | 34.8 KiB | 00m00s [ 96/301] perl-Hash-Util-FieldHash-0:1. 100% | 629.6 KiB/s | 39.0 KiB | 00m00s [ 97/301] perl-I18N-Collate-0:1.02-519. 100% | 249.2 KiB/s | 14.5 KiB | 00m00s [ 98/301] perl-I18N-LangTags-0:0.45-519 100% | 652.8 KiB/s | 52.9 KiB | 00m00s [ 99/301] perl-I18N-Langinfo-0:0.24-519 100% | 365.0 KiB/s | 25.9 KiB | 00m00s [100/301] perl-IO-Socket-IP-0:0.43-520. 100% | 485.8 KiB/s | 42.3 KiB | 00m00s [101/301] perl-IO-0:1.55-519.fc43.x86_6 100% | 508.8 KiB/s | 82.4 KiB | 00m00s [102/301] perl-IO-Compress-0:2.213-520. 100% | 1.4 MiB/s | 305.5 KiB | 00m00s [103/301] perl-IO-Zlib-1:1.15-519.fc43. 100% | 163.1 KiB/s | 19.6 KiB | 00m00s [104/301] perl-IPC-Cmd-2:1.04-520.fc43. 100% | 382.6 KiB/s | 39.8 KiB | 00m00s [105/301] perl-IPC-Open3-0:1.24-519.fc4 100% | 711.4 KiB/s | 24.2 KiB | 00m00s [106/301] perl-IPC-SysV-0:2.09-520.fc43 100% | 1.2 MiB/s | 40.8 KiB | 00m00s [107/301] perl-Locale-Maketext-Simple-1 100% | 196.1 KiB/s | 17.8 KiB | 00m00s [108/301] perl-JSON-PP-1:4.16-520.fc43. 100% | 478.8 KiB/s | 65.6 KiB | 00m00s [109/301] perl-Locale-Maketext-0:1.33-5 100% | 774.2 KiB/s | 93.7 KiB | 00m00s [110/301] perl-MIME-Base64-0:3.16-519.f 100% | 805.1 KiB/s | 29.8 KiB | 00m00s [111/301] perl-Math-BigInt-FastCalc-0:0 100% | 329.1 KiB/s | 28.3 KiB | 00m00s [112/301] perl-Math-Complex-0:1.63-519. 100% | 587.8 KiB/s | 46.4 KiB | 00m00s [113/301] perl-Math-BigInt-1:2.0050.03- 100% | 1.5 MiB/s | 234.8 KiB | 00m00s [114/301] perl-Memoize-0:1.17-519.fc43. 100% | 632.6 KiB/s | 46.8 KiB | 00m00s [115/301] perl-Module-CoreList-tools-1: 100% | 186.5 KiB/s | 18.6 KiB | 00m00s [116/301] perl-Module-Load-1:0.36-519.f 100% | 162.1 KiB/s | 17.3 KiB | 00m00s [117/301] perl-Module-CoreList-1:5.2025 100% | 567.2 KiB/s | 93.0 KiB | 00m00s [118/301] perl-Module-Load-Conditional- 100% | 646.5 KiB/s | 22.0 KiB | 00m00s [119/301] perl-Module-Loaded-1:0.08-519 100% | 651.0 KiB/s | 13.7 KiB | 00m00s [120/301] perl-Module-Metadata-0:1.0000 100% | 817.9 KiB/s | 35.2 KiB | 00m00s [121/301] perl-NDBM_File-0:1.18-519.fc4 100% | 586.9 KiB/s | 22.9 KiB | 00m00s [122/301] perl-NEXT-0:0.69-519.fc43.noa 100% | 372.0 KiB/s | 21.2 KiB | 00m00s [123/301] perl-Net-0:1.04-519.fc43.noar 100% | 249.4 KiB/s | 22.9 KiB | 00m00s [124/301] perl-Net-Ping-0:2.76-519.fc43 100% | 462.6 KiB/s | 49.5 KiB | 00m00s [125/301] perl-ODBM_File-0:1.20-519.fc4 100% | 221.8 KiB/s | 23.1 KiB | 00m00s [126/301] perl-Opcode-0:1.69-519.fc43.x 100% | 404.3 KiB/s | 36.0 KiB | 00m00s [127/301] perl-Params-Check-1:0.38-519. 100% | 170.5 KiB/s | 21.7 KiB | 00m00s [128/301] perl-Perl-OSType-0:1.010-520. 100% | 206.5 KiB/s | 22.9 KiB | 00m00s [129/301] perl-POSIX-0:2.23-519.fc43.x8 100% | 456.2 KiB/s | 98.1 KiB | 00m00s [130/301] perl-PerlIO-via-QuotedPrint-0 100% | 174.3 KiB/s | 21.6 KiB | 00m00s [131/301] perl-Pod-Checker-4:1.77-519.f 100% | 316.6 KiB/s | 31.7 KiB | 00m00s [132/301] perl-Pod-Escapes-1:1.07-519.f 100% | 239.0 KiB/s | 19.8 KiB | 00m00s [133/301] perl-Pod-Functions-0:1.14-519 100% | 107.5 KiB/s | 14.9 KiB | 00m00s [134/301] perl-Pod-Html-0:1.35-519.fc43 100% | 216.0 KiB/s | 29.8 KiB | 00m00s [135/301] perl-Pod-Usage-4:2.05-519.fc4 100% | 903.9 KiB/s | 40.7 KiB | 00m00s [136/301] perl-Pod-Perldoc-0:3.28.01-52 100% | 509.3 KiB/s | 84.5 KiB | 00m00s [137/301] perl-Pod-Simple-1:3.47-2.fc43 100% | 616.6 KiB/s | 220.1 KiB | 00m00s [138/301] perl-Safe-0:2.47-519.fc43.noa 100% | 77.3 KiB/s | 25.2 KiB | 00m00s [139/301] perl-Search-Dict-0:1.08-519.f 100% | 41.6 KiB/s | 13.3 KiB | 00m00s [140/301] perl-SelectSaver-0:1.02-519.f 100% | 17.8 KiB/s | 12.0 KiB | 00m01s [141/301] perl-SelfLoader-0:1.28-519.fc 100% | 31.4 KiB/s | 21.7 KiB | 00m01s [142/301] perl-Socket-4:2.040-1.fc43.x8 100% | 74.6 KiB/s | 54.8 KiB | 00m01s [143/301] perl-Symbol-0:1.09-519.fc43.n 100% | 78.2 KiB/s | 14.5 KiB | 00m00s [144/301] perl-Sys-Hostname-0:1.25-519. 100% | 87.1 KiB/s | 17.4 KiB | 00m00s [145/301] perl-Storable-1:3.37-520.fc43 100% | 351.8 KiB/s | 98.5 KiB | 00m00s [146/301] perl-Sys-Syslog-0:0.36-520.fc 100% | 574.8 KiB/s | 46.6 KiB | 00m00s [147/301] perl-Term-ANSIColor-0:5.01-52 100% | 783.9 KiB/s | 47.8 KiB | 00m00s [148/301] perl-Term-Cap-0:1.18-519.fc43 100% | 343.4 KiB/s | 22.0 KiB | 00m00s [149/301] perl-Term-Complete-0:1.403-51 100% | 232.6 KiB/s | 13.3 KiB | 00m00s [150/301] perl-Term-ReadLine-0:1.17-519 100% | 495.1 KiB/s | 19.3 KiB | 00m00s [151/301] perl-Term-Table-0:0.024-519.f 100% | 862.1 KiB/s | 43.1 KiB | 00m00s [152/301] perl-Test-0:1.31-519.fc43.noa 100% | 246.5 KiB/s | 28.8 KiB | 00m00s [153/301] perl-Text-Abbrev-0:1.02-519.f 100% | 86.9 KiB/s | 12.4 KiB | 00m00s [154/301] perl-Test-Harness-1:3.52-3.fc 100% | 461.2 KiB/s | 277.7 KiB | 00m01s [155/301] perl-Test-Simple-3:1.302214-3 100% | 1.1 MiB/s | 863.2 KiB | 00m01s [156/301] perl-Text-Balanced-0:2.06-519 100% | 90.3 KiB/s | 48.7 KiB | 00m01s [157/301] perl-Text-ParseWords-0:3.31-5 100% | 47.0 KiB/s | 16.4 KiB | 00m00s [158/301] perl-Text-Tabs+Wrap-0:2024.00 100% | 115.5 KiB/s | 21.7 KiB | 00m00s [159/301] perl-Thread-0:3.06-519.fc43.n 100% | 78.8 KiB/s | 18.3 KiB | 00m00s [160/301] perl-Thread-Queue-0:3.14-519. 100% | 264.0 KiB/s | 21.4 KiB | 00m00s [161/301] perl-Thread-Semaphore-0:2.13- 100% | 201.5 KiB/s | 15.9 KiB | 00m00s [162/301] perl-Tie-0:4.6-519.fc43.noarc 100% | 638.7 KiB/s | 28.1 KiB | 00m00s [163/301] perl-Tie-File-0:1.10-519.fc43 100% | 946.2 KiB/s | 43.5 KiB | 00m00s [164/301] perl-Tie-Memoize-0:1.1-519.fc 100% | 261.5 KiB/s | 14.4 KiB | 00m00s [165/301] perl-Tie-RefHash-0:1.41-519.f 100% | 185.8 KiB/s | 23.6 KiB | 00m00s [166/301] perl-Time-0:1.04-519.fc43.noa 100% | 124.0 KiB/s | 17.1 KiB | 00m00s [167/301] perl-Time-HiRes-4:1.9778-519. 100% | 439.9 KiB/s | 57.2 KiB | 00m00s [168/301] perl-Time-Local-2:1.350-519.f 100% | 649.1 KiB/s | 34.4 KiB | 00m00s [169/301] perl-Time-Piece-0:1.3600-519. 100% | 967.1 KiB/s | 40.6 KiB | 00m00s [170/301] perl-Unicode-Collate-0:1.31-5 100% | 2.2 MiB/s | 644.6 KiB | 00m00s [171/301] perl-Unicode-Normalize-0:1.32 100% | 277.4 KiB/s | 74.1 KiB | 00m00s [172/301] perl-Unicode-UCD-0:0.81-519.f 100% | 322.3 KiB/s | 79.6 KiB | 00m00s [173/301] perl-User-pwent-0:1.05-519.fc 100% | 521.8 KiB/s | 19.8 KiB | 00m00s [174/301] perl-autouse-0:1.11-519.fc43. 100% | 133.9 KiB/s | 14.1 KiB | 00m00s [175/301] perl-base-0:2.27-519.fc43.noa 100% | 238.9 KiB/s | 16.5 KiB | 00m00s [176/301] perl-autodie-0:2.37-520.fc43. 100% | 897.0 KiB/s | 96.9 KiB | 00m00s [177/301] perl-bignum-0:0.67-520.fc43.n 100% | 1.5 MiB/s | 49.1 KiB | 00m00s [178/301] perl-blib-0:1.07-519.fc43.noa 100% | 191.9 KiB/s | 12.7 KiB | 00m00s [179/301] perl-constant-0:1.33-520.fc43 100% | 227.8 KiB/s | 23.0 KiB | 00m00s [180/301] perl-deprecate-0:0.04-519.fc4 100% | 133.8 KiB/s | 14.8 KiB | 00m00s [181/301] perl-debugger-0:1.60-519.fc43 100% | 583.7 KiB/s | 133.7 KiB | 00m00s [182/301] perl-devel-4:5.42.0-519.fc43. 100% | 1.9 MiB/s | 663.7 KiB | 00m00s [183/301] perl-diagnostics-0:1.40-519.f 100% | 613.3 KiB/s | 220.8 KiB | 00m00s [184/301] perl-encoding-4:3.00-519.fc43 100% | 495.8 KiB/s | 63.0 KiB | 00m00s [185/301] perl-doc-0:5.42.0-519.fc43.no 100% | 4.5 MiB/s | 5.0 MiB | 00m01s [186/301] perl-encoding-warnings-0:0.14 100% | 20.2 KiB/s | 16.8 KiB | 00m01s [187/301] perl-experimental-0:0.036-1.f 100% | 33.6 KiB/s | 27.1 KiB | 00m01s [188/301] perl-fields-0:2.27-519.fc43.n 100% | 34.1 KiB/s | 16.4 KiB | 00m00s [189/301] perl-filetest-0:1.03-519.fc43 100% | 29.9 KiB/s | 14.9 KiB | 00m00s [190/301] perl-if-0:0.61.000-519.fc43.n 100% | 27.8 KiB/s | 14.3 KiB | 00m01s [191/301] perl-less-0:0.03-519.fc43.noa 100% | 79.7 KiB/s | 13.5 KiB | 00m00s [192/301] perl-lib-0:0.65-519.fc43.x86_ 100% | 89.0 KiB/s | 15.2 KiB | 00m00s [193/301] perl-libnetcfg-4:5.42.0-519.f 100% | 172.8 KiB/s | 16.6 KiB | 00m00s [194/301] perl-libnet-0:3.15-520.fc43.n 100% | 467.3 KiB/s | 128.5 KiB | 00m00s [195/301] perl-locale-0:1.13-519.fc43.n 100% | 269.9 KiB/s | 13.8 KiB | 00m00s [196/301] perl-libs-4:5.42.0-519.fc43.x 100% | 3.4 MiB/s | 2.6 MiB | 00m01s [197/301] perl-macros-4:5.42.0-519.fc43 100% | 20.0 KiB/s | 12.6 KiB | 00m01s [198/301] perl-meta-notation-0:5.42.0-5 100% | 17.6 KiB/s | 10.9 KiB | 00m01s [199/301] perl-mro-0:1.29-519.fc43.x86_ 100% | 202.4 KiB/s | 30.2 KiB | 00m00s [200/301] perl-open-0:1.13-519.fc43.noa 100% | 88.4 KiB/s | 16.8 KiB | 00m00s [201/301] perl-overload-0:1.40-519.fc43 100% | 208.2 KiB/s | 45.8 KiB | 00m00s [202/301] perl-overloading-0:0.02-519.f 100% | 153.2 KiB/s | 13.2 KiB | 00m00s [203/301] perl-parent-1:0.244-519.fc43. 100% | 322.7 KiB/s | 14.8 KiB | 00m00s [204/301] perl-ph-0:5.42.0-519.fc43.x86 100% | 932.2 KiB/s | 51.3 KiB | 00m00s [205/301] perl-perlfaq-0:5.20250619-519 100% | 2.3 MiB/s | 378.8 KiB | 00m00s [206/301] perl-sigtrap-0:1.10-519.fc43. 100% | 173.0 KiB/s | 15.9 KiB | 00m00s [207/301] perl-podlators-1:6.0.2-519.fc 100% | 880.4 KiB/s | 128.5 KiB | 00m00s [208/301] perl-sort-0:2.06-519.fc43.noa 100% | 232.0 KiB/s | 13.5 KiB | 00m00s [209/301] perl-subs-0:1.04-519.fc43.noa 100% | 176.2 KiB/s | 12.0 KiB | 00m00s [210/301] perl-threads-1:2.43-519.fc43. 100% | 732.9 KiB/s | 57.9 KiB | 00m00s [211/301] perl-threads-shared-0:1.70-51 100% | 468.7 KiB/s | 44.5 KiB | 00m00s [212/301] perl-utils-0:5.42.0-519.fc43. 100% | 432.0 KiB/s | 52.7 KiB | 00m00s [213/301] perl-vars-0:1.05-519.fc43.noa 100% | 89.6 KiB/s | 13.3 KiB | 00m00s [214/301] perl-version-9:0.99.33-520.fc 100% | 386.6 KiB/s | 63.0 KiB | 00m00s [215/301] perl-vmsish-0:1.04-519.fc43.n 100% | 95.6 KiB/s | 14.3 KiB | 00m00s [216/301] numactl-libs-0:2.0.19-2.fc42. 100% | 98.3 KiB/s | 31.3 KiB | 00m00s [217/301] perl-MIME-Base32-0:1.303-23.f 100% | 88.0 KiB/s | 20.5 KiB | 00m00s [218/301] less-0:679-1.fc43.x86_64 100% | 503.5 KiB/s | 195.3 KiB | 00m00s [219/301] man-db-0:2.13.1-1.fc43.x86_64 100% | 3.9 MiB/s | 1.4 MiB | 00m00s [220/301] libdrm-0:2.4.125-1.fc43.x86_6 100% | 449.1 KiB/s | 161.2 KiB | 00m00s [221/301] perl-Text-Diff-0:1.45-23.fc42 100% | 607.5 KiB/s | 40.1 KiB | 00m00s [222/301] perl-IO-Compress-Lzma-0:2.213 100% | 323.7 KiB/s | 76.7 KiB | 00m00s [223/301] perl-Devel-Size-0:0.85-2.fc43 100% | 247.3 KiB/s | 30.7 KiB | 00m00s [224/301] perl-Archive-Zip-0:1.68-16.fc 100% | 331.8 KiB/s | 111.5 KiB | 00m00s [225/301] perl-Compress-Bzip2-0:2.28-23 100% | 239.4 KiB/s | 66.8 KiB | 00m00s [226/301] perl-File-HomeDir-0:1.006-14. 100% | 310.4 KiB/s | 59.3 KiB | 00m00s [227/301] perl-Text-Glob-0:0.11-25.fc42 100% | 25.9 KiB/s | 13.4 KiB | 00m01s [228/301] perl-Module-Build-2:0.42.34-8 100% | 399.8 KiB/s | 251.5 KiB | 00m01s [229/301] perl-Module-Signature-0:0.93- 100% | 139.5 KiB/s | 87.7 KiB | 00m01s [230/301] perl-local-lib-0:2.000029-9.f 100% | 308.6 KiB/s | 66.3 KiB | 00m00s [231/301] libdb-0:5.3.28-65.fc43.x86_64 100% | 3.6 MiB/s | 770.8 KiB | 00m00s [232/301] perl-IO-Socket-SSL-0:2.095-1. 100% | 1.0 MiB/s | 231.6 KiB | 00m00s [233/301] perl-Net-SSLeay-0:1.94-10.fc4 100% | 1.2 MiB/s | 375.0 KiB | 00m00s [234/301] groff-base-0:1.23.0-8.fc42.x8 100% | 3.3 MiB/s | 1.1 MiB | 00m00s [235/301] ncurses-0:6.5-6.20250614.fc43 100% | 955.8 KiB/s | 426.3 KiB | 00m00s [236/301] perl-IPC-System-Simple-0:1.30 100% | 160.2 KiB/s | 38.8 KiB | 00m00s [237/301] libxcrypt-devel-0:4.4.38-7.fc 100% | 172.8 KiB/s | 29.4 KiB | 00m00s [238/301] libpipeline-0:1.5.8-2.fc42.x8 100% | 314.3 KiB/s | 60.0 KiB | 00m00s [239/301] libpciaccess-0:0.16-15.fc42.x 100% | 134.1 KiB/s | 26.3 KiB | 00m00s [240/301] systemtap-sdt-dtrace-0:5.3-2. 100% | 201.9 KiB/s | 69.4 KiB | 00m00s [241/301] perl-Compress-Raw-Lzma-0:2.21 100% | 262.8 KiB/s | 51.5 KiB | 00m00s [242/301] perl-Algorithm-Diff-0:1.2010- 100% | 237.8 KiB/s | 46.4 KiB | 00m00s [243/301] perl-inc-latest-2:0.500-30.fc 100% | 122.7 KiB/s | 23.3 KiB | 00m00s [244/301] perl-Software-License-0:0.104 100% | 424.0 KiB/s | 148.0 KiB | 00m00s [245/301] glibc-devel-0:2.41.9000-23.fc 100% | 750.9 KiB/s | 562.4 KiB | 00m01s [246/301] python3-pyparsing-0:3.1.2-11. 100% | 368.7 KiB/s | 286.9 KiB | 00m01s [247/301] perl-Data-Section-0:0.200008- 100% | 128.5 KiB/s | 24.9 KiB | 00m00s [248/301] hwdata-0:0.397-1.fc43.noarch 100% | 2.0 MiB/s | 1.7 MiB | 00m01s [249/301] perl-Text-Template-0:1.61-7.f 100% | 328.5 KiB/s | 59.1 KiB | 00m00s [250/301] perl-MRO-Compat-0:0.15-11.fc4 100% | 136.1 KiB/s | 25.4 KiB | 00m00s [251/301] perl-Data-OptList-0:0.114-6.f 100% | 268.1 KiB/s | 26.8 KiB | 00m00s [252/301] perl-Package-Generator-0:1.10 100% | 200.2 KiB/s | 22.4 KiB | 00m00s [253/301] perl-Sub-Exporter-0:0.991-5.f 100% | 570.2 KiB/s | 77.5 KiB | 00m00s [254/301] perl-Params-Util-0:1.102-18.f 100% | 616.6 KiB/s | 32.7 KiB | 00m00s [255/301] perl-Sub-Install-0:0.929-7.fc 100% | 754.5 KiB/s | 22.6 KiB | 00m00s [256/301] python3-0:3.14.0~b4-1.fc43.x8 100% | 661.7 KiB/s | 27.1 KiB | 00m00s [257/301] mpdecimal-0:4.0.1-1.fc43.x86_ 100% | 172.7 KiB/s | 97.1 KiB | 00m01s [258/301] python3-libs-0:3.14.0~b4-1.fc 100% | 9.2 MiB/s | 9.8 MiB | 00m01s [259/301] python-pip-wheel-0:25.1.1-13. 100% | 1.0 MiB/s | 1.2 MiB | 00m01s [260/301] tzdata-0:2025b-1.fc43.noarch 100% | 1.0 MiB/s | 714.0 KiB | 00m01s [261/301] perl-Encode-4:3.21-519.fc43.x 100% | 3.4 MiB/s | 1.1 MiB | 00m00s [262/301] perl-Encode-devel-4:3.21-519. 100% | 250.4 KiB/s | 41.1 KiB | 00m00s [263/301] systemtap-sdt-devel-0:5.3-2.f 100% | 272.6 KiB/s | 68.7 KiB | 00m00s [264/301] kernel-headers-0:6.16.0-0.rc7 100% | 3.6 MiB/s | 1.7 MiB | 00m00s [265/301] procps-ng-0:4.0.4-6.fc42.x86_ 100% | 826.5 KiB/s | 365.3 KiB | 00m00s [266/301] rocm-smi-0:6.4.2-1.fc43.x86_6 100% | 9.2 MiB/s | 604.0 KiB | 00m00s [267/301] tcl-1:9.0.2-1.fc43.x86_64 100% | 2.2 MiB/s | 1.2 MiB | 00m01s [268/301] hipcc-0:19-12.rocm6.4.2.fc43. 100% | 6.2 MiB/s | 134.2 KiB | 00m00s [269/301] libtommath-0:1.3.1~rc1-5.fc42 100% | 337.0 KiB/s | 64.4 KiB | 00m00s [270/301] libdrm-devel-0:2.4.125-1.fc43 100% | 1.9 MiB/s | 183.4 KiB | 00m00s [271/301] rocm-device-libs-0:19-12.rocm 100% | 21.8 MiB/s | 490.2 KiB | 00m00s [272/301] rocm-clang-devel-0:19-12.rocm 100% | 30.9 MiB/s | 2.4 MiB | 00m00s [273/301] rocm-clang-0:19-12.rocm6.4.2. 100% | 59.0 MiB/s | 16.0 MiB | 00m00s [274/301] rocm-clang-runtime-devel-0:19 100% | 1.7 MiB/s | 492.9 KiB | 00m00s [275/301] rocm-clang-libs-0:19-12.rocm6 100% | 49.5 MiB/s | 22.8 MiB | 00m00s [276/301] rocm-libc++-devel-0:19-12.roc 100% | 4.3 MiB/s | 904.2 KiB | 00m00s [277/301] git-0:2.50.1-1.fc43.x86_64 100% | 398.4 KiB/s | 51.0 KiB | 00m00s [278/301] rocm-libc++-0:19-12.rocm6.4.2 100% | 8.7 MiB/s | 346.3 KiB | 00m00s [279/301] rocm-llvm-libs-0:19-12.rocm6. 100% | 82.6 MiB/s | 20.2 MiB | 00m00s [280/301] perl-Git-0:2.50.1-1.fc43.noar 100% | 84.6 KiB/s | 37.8 KiB | 00m00s [281/301] git-core-0:2.50.1-1.fc43.x86_ 100% | 6.2 MiB/s | 5.0 MiB | 00m01s [282/301] rocm-llvm-filesystem-0:19-12. 100% | 1.2 MiB/s | 24.6 KiB | 00m00s [283/301] git-core-doc-0:2.50.1-1.fc43. 100% | 2.9 MiB/s | 3.1 MiB | 00m01s [284/301] perl-TermReadKey-0:2.38-25.fc 100% | 87.8 KiB/s | 35.3 KiB | 00m00s [285/301] perl-Error-1:0.17030-1.fc43.n 100% | 125.5 KiB/s | 40.4 KiB | 00m00s [286/301] openssh-clients-0:10.0p1-4.fc 100% | 1.1 MiB/s | 747.0 KiB | 00m01s [287/301] libedit-0:3.1-55.20250104cvs. 100% | 217.1 KiB/s | 105.3 KiB | 00m00s [288/301] rocm-lld-0:19-12.rocm6.4.2.fc 100% | 41.4 MiB/s | 1.5 MiB | 00m00s [289/301] libfido2-0:1.16.0-2.fc43.x86_ 100% | 455.8 KiB/s | 98.5 KiB | 00m00s [290/301] openssh-0:10.0p1-4.fc43.x86_6 100% | 1.4 MiB/s | 339.7 KiB | 00m00s [291/301] libcbor-0:0.12.0-5.fc43.x86_6 100% | 279.2 KiB/s | 33.5 KiB | 00m00s [292/301] rocm-llvm-devel-0:19-12.rocm6 100% | 16.9 MiB/s | 3.8 MiB | 00m00s [293/301] rocm-llvm-static-0:19-12.rocm 100% | 59.2 MiB/s | 29.4 MiB | 00m00s [294/301] rocm-core-0:6.4.2-1.fc43.x86_ 100% | 84.4 KiB/s | 13.6 KiB | 00m00s [295/301] rocm-llvm-0:19-12.rocm6.4.2.f 100% | 32.5 MiB/s | 13.1 MiB | 00m00s [296/301] gcc-plugin-annobin-0:15.1.1-3 100% | 5.8 MiB/s | 53.6 KiB | 00m00s [297/301] libpciaccess-devel-0:0.16-15. 100% | 128.2 KiB/s | 12.4 KiB | 00m00s [298/301] zlib-ng-compat-devel-0:2.2.4- 100% | 281.9 KiB/s | 38.3 KiB | 00m00s [299/301] cmake-rpm-macros-0:3.31.6-3.f 100% | 56.3 KiB/s | 15.8 KiB | 00m00s [300/301] annobin-plugin-gcc-0:12.98-1. 100% | 2.0 MiB/s | 997.1 KiB | 00m00s [301/301] annobin-docs-0:12.98-1.fc43.n 100% | 208.2 KiB/s | 90.2 KiB | 00m00s -------------------------------------------------------------------------------- [301/301] Total 100% | 11.3 MiB/s | 295.4 MiB | 00m26s Running transaction [ 1/303] Verify package files 100% | 235.0 B/s | 301.0 B | 00m01s [ 2/303] Prepare transaction 100% | 1.3 KiB/s | 301.0 B | 00m00s [ 3/303] Installing cmake-filesystem-0 100% | 1.9 MiB/s | 7.6 KiB | 00m00s [ 4/303] Installing less-0:679-1.fc43. 100% | 21.0 MiB/s | 409.4 KiB | 00m00s [ 5/303] Installing libmpc-0:1.3.1-7.f 100% | 81.1 MiB/s | 166.1 KiB | 00m00s [ 6/303] Installing make-1:4.4.1-10.fc 100% | 66.7 MiB/s | 1.8 MiB | 00m00s [ 7/303] Installing expat-0:2.7.1-1.fc 100% | 18.1 MiB/s | 296.3 KiB | 00m00s [ 8/303] Installing rocm-llvm-filesyst 100% | 2.6 MiB/s | 18.5 KiB | 00m00s [ 9/303] Installing rocm-libc++-0:19-1 100% | 32.4 MiB/s | 1.2 MiB | 00m00s [ 10/303] Installing rocm-llvm-libs-0:1 100% | 65.6 MiB/s | 84.8 MiB | 00m01s [ 11/303] Installing rocm-clang-libs-0: 100% | 66.3 MiB/s | 98.4 MiB | 00m01s [ 12/303] Installing kernel-headers-0:6 100% | 98.9 MiB/s | 6.8 MiB | 00m00s [ 13/303] Installing libxcrypt-devel-0: 100% | 10.8 MiB/s | 33.1 KiB | 00m00s [ 14/303] Installing glibc-devel-0:2.41 100% | 45.9 MiB/s | 2.3 MiB | 00m00s [ 15/303] Installing groff-base-0:1.23. 100% | 69.5 MiB/s | 3.9 MiB | 00m00s [ 16/303] Installing numactl-libs-0:2.0 100% | 26.3 MiB/s | 53.8 KiB | 00m00s [ 17/303] Installing vim-filesystem-2:9 100% | 2.3 MiB/s | 4.7 KiB | 00m00s [ 18/303] Installing rocm-comgr-0:19-12 100% | 61.6 MiB/s | 123.9 MiB | 00m02s [ 19/303] Installing rocm-lld-0:19-12.r 100% | 59.8 MiB/s | 5.7 MiB | 00m00s [ 20/303] Installing rocm-libc++-devel- 100% | 60.7 MiB/s | 7.7 MiB | 00m00s [ 21/303] Installing cpp-0:15.1.1-3.fc4 100% | 259.6 MiB/s | 37.9 MiB | 00m00s [ 22/303] Installing gcc-0:15.1.1-3.fc4 100% | 288.9 MiB/s | 111.2 MiB | 00m00s [ 23/303] Installing zlib-ng-compat-dev 100% | 53.0 MiB/s | 108.5 KiB | 00m00s [ 24/303] Installing annobin-docs-0:12. 100% | 97.7 MiB/s | 100.1 KiB | 00m00s [ 25/303] Installing rocm-core-0:6.4.2- 100% | 13.2 MiB/s | 13.5 KiB | 00m00s [ 26/303] Installing libcbor-0:0.12.0-5 100% | 77.3 MiB/s | 79.2 KiB | 00m00s [ 27/303] Installing libfido2-0:1.16.0- 100% | 117.2 MiB/s | 240.0 KiB | 00m00s [ 28/303] Installing openssh-0:10.0p1-4 100% | 73.3 MiB/s | 1.4 MiB | 00m00s [ 29/303] Installing libedit-0:3.1-55.2 100% | 80.0 MiB/s | 245.8 KiB | 00m00s [ 30/303] Installing openssh-clients-0: 100% | 74.5 MiB/s | 2.6 MiB | 00m00s [ 31/303] Installing git-core-0:2.50.1- 100% | 253.1 MiB/s | 23.5 MiB | 00m00s [ 32/303] Installing git-core-doc-0:2.5 100% | 183.1 MiB/s | 17.9 MiB | 00m00s [ 33/303] Installing rocm-clang-runtime 100% | 105.3 MiB/s | 6.9 MiB | 00m00s [ 34/303] Installing libtommath-0:1.3.1 100% | 64.2 MiB/s | 131.5 KiB | 00m00s [ 35/303] Installing tcl-1:9.0.2-1.fc43 100% | 114.1 MiB/s | 4.3 MiB | 00m00s [ 36/303] Installing procps-ng-0:4.0.4- 100% | 48.1 MiB/s | 1.0 MiB | 00m00s [ 37/303] Installing systemtap-sdt-deve 100% | 36.0 MiB/s | 184.3 KiB | 00m00s [ 38/303] Installing tzdata-0:2025b-1.f 100% | 24.9 MiB/s | 1.9 MiB | 00m00s [ 39/303] Installing python-pip-wheel-0 100% | 311.3 MiB/s | 1.2 MiB | 00m00s [ 40/303] Installing mpdecimal-0:4.0.1- 100% | 30.5 MiB/s | 218.8 KiB | 00m00s [ 41/303] Installing python3-libs-0:3.1 100% | 199.3 MiB/s | 43.3 MiB | 00m00s [ 42/303] Installing python3-0:3.14.0~b 100% | 2.0 MiB/s | 30.7 KiB | 00m00s [ 43/303] Installing cmake-rpm-macros-0 100% | 8.1 MiB/s | 8.3 KiB | 00m00s [ 44/303] Installing python3-pyparsing- 100% | 171.6 MiB/s | 1.0 MiB | 00m00s [ 45/303] Installing systemtap-sdt-dtra 100% | 11.8 MiB/s | 180.9 KiB | 00m00s [ 46/303] Installing rocm-smi-0:6.4.2-1 100% | 120.7 MiB/s | 2.7 MiB | 00m00s [ 47/303] Installing hwdata-0:0.397-1.f 100% | 341.5 MiB/s | 9.6 MiB | 00m00s [ 48/303] Installing libpciaccess-0:0.1 100% | 44.8 MiB/s | 45.9 KiB | 00m00s [ 49/303] Installing libdrm-0:2.4.125-1 100% | 97.6 MiB/s | 399.7 KiB | 00m00s [ 50/303] Installing rocm-runtime-0:6.4 100% | 341.7 MiB/s | 3.1 MiB | 00m00s [ 51/303] Installing rocm-runtime-devel 100% | 187.2 MiB/s | 574.9 KiB | 00m00s [ 52/303] Installing rocm-llvm-0:19-12. 100% | 61.2 MiB/s | 48.5 MiB | 00m01s [ 53/303] Installing rocm-llvm-devel-0: 100% | 66.7 MiB/s | 25.7 MiB | 00m00s [ 54/303] Installing rocm-llvm-static-0 100% | 93.2 MiB/s | 250.3 MiB | 00m03s [ 55/303] Installing libpciaccess-devel 100% | 15.5 MiB/s | 15.9 KiB | 00m00s [ 56/303] Installing libdrm-devel-0:2.4 100% | 120.1 MiB/s | 737.9 KiB | 00m00s [ 57/303] Installing libpipeline-0:1.5. 100% | 7.2 MiB/s | 146.6 KiB | 00m00s [ 58/303] Installing man-db-0:2.13.1-1. 100% | 49.4 MiB/s | 2.9 MiB | 00m00s [ 59/303] Installing environment-module 100% | 39.2 MiB/s | 1.8 MiB | 00m00s [ 60/303] Installing ncurses-0:6.5-6.20 100% | 31.7 MiB/s | 616.4 KiB | 00m00s [ 61/303] Installing perl-Digest-0:1.20 100% | 36.2 MiB/s | 37.1 KiB | 00m00s [ 62/303] Installing perl-FileHandle-0: 100% | 9.6 MiB/s | 9.8 KiB | 00m00s [ 63/303] Installing perl-B-0:1.89-519. 100% | 123.2 MiB/s | 504.7 KiB | 00m00s [ 64/303] Installing perl-Digest-MD5-0: 100% | 30.1 MiB/s | 61.6 KiB | 00m00s [ 65/303] Installing perl-MIME-Base32-0 100% | 31.4 MiB/s | 32.2 KiB | 00m00s [ 66/303] Installing perl-libnet-0:3.15 100% | 95.9 MiB/s | 294.7 KiB | 00m00s [ 67/303] Installing perl-Data-Dumper-0 100% | 57.4 MiB/s | 117.5 KiB | 00m00s [ 68/303] Installing perl-URI-0:5.32-1. 100% | 44.6 MiB/s | 274.1 KiB | 00m00s [ 69/303] Installing perl-IO-Socket-IP- 100% | 49.9 MiB/s | 102.2 KiB | 00m00s [ 70/303] Installing perl-AutoLoader-0: 100% | 20.5 MiB/s | 21.0 KiB | 00m00s [ 71/303] Installing perl-Net-SSLeay-0: 100% | 123.5 MiB/s | 1.4 MiB | 00m00s [ 72/303] Installing perl-IO-Socket-SSL 100% | 140.3 MiB/s | 718.6 KiB | 00m00s [ 73/303] Installing perl-Pod-Escapes-1 100% | 25.3 MiB/s | 25.9 KiB | 00m00s [ 74/303] Installing perl-File-Path-0:2 100% | 63.0 MiB/s | 64.5 KiB | 00m00s [ 75/303] Installing perl-Time-Local-2: 100% | 68.9 MiB/s | 70.6 KiB | 00m00s [ 76/303] Installing perl-locale-0:1.13 100% | 6.4 MiB/s | 6.5 KiB | 00m00s [ 77/303] Installing perl-if-0:0.61.000 100% | 6.1 MiB/s | 6.2 KiB | 00m00s [ 78/303] Installing perl-Text-Tabs+Wra 100% | 23.3 MiB/s | 23.9 KiB | 00m00s [ 79/303] Installing perl-Pod-Simple-1: 100% | 112.3 MiB/s | 574.8 KiB | 00m00s [ 80/303] Installing perl-HTTP-Tiny-0:0 100% | 76.4 MiB/s | 156.4 KiB | 00m00s [ 81/303] Installing perl-Term-Cap-0:1. 100% | 29.9 MiB/s | 30.6 KiB | 00m00s [ 82/303] Installing perl-File-Temp-1:0 100% | 80.1 MiB/s | 164.1 KiB | 00m00s [ 83/303] Installing perl-IPC-Open3-0:1 100% | 27.8 MiB/s | 28.5 KiB | 00m00s [ 84/303] Installing perl-POSIX-0:2.23- 100% | 113.6 MiB/s | 232.6 KiB | 00m00s [ 85/303] Installing perl-Term-ANSIColo 100% | 96.9 MiB/s | 99.2 KiB | 00m00s [ 86/303] Installing perl-Class-Struct- 100% | 25.3 MiB/s | 25.9 KiB | 00m00s [ 87/303] Installing perl-podlators-1:6 100% | 19.6 MiB/s | 321.4 KiB | 00m00s [ 88/303] Installing perl-Pod-Perldoc-0 100% | 10.3 MiB/s | 169.2 KiB | 00m00s [ 89/303] Installing perl-File-stat-0:1 100% | 12.8 MiB/s | 13.1 KiB | 00m00s [ 90/303] Installing perl-Symbol-0:1.09 100% | 7.1 MiB/s | 7.3 KiB | 00m00s [ 91/303] Installing perl-SelectSaver-0 100% | 2.6 MiB/s | 2.6 KiB | 00m00s [ 92/303] Installing perl-Socket-4:2.04 100% | 59.7 MiB/s | 122.3 KiB | 00m00s [ 93/303] Installing perl-Pod-Usage-4:2 100% | 5.7 MiB/s | 87.9 KiB | 00m00s [ 94/303] Installing perl-overloading-0 100% | 5.4 MiB/s | 5.6 KiB | 00m00s [ 95/303] Installing perl-IO-0:1.55-519 100% | 49.4 MiB/s | 151.7 KiB | 00m00s [ 96/303] Installing perl-mro-0:1.29-51 100% | 41.7 MiB/s | 42.7 KiB | 00m00s [ 97/303] Installing perl-base-0:2.27-5 100% | 12.7 MiB/s | 13.0 KiB | 00m00s [ 98/303] Installing perl-Text-ParseWor 100% | 14.2 MiB/s | 14.6 KiB | 00m00s [ 99/303] Installing perl-Fcntl-0:1.20- 100% | 48.7 MiB/s | 49.9 KiB | 00m00s [100/303] Installing perl-Getopt-Long-1 100% | 71.9 MiB/s | 147.2 KiB | 00m00s [101/303] Installing perl-vars-0:1.05-5 100% | 4.2 MiB/s | 4.3 KiB | 00m00s [102/303] Installing perl-parent-1:0.24 100% | 10.7 MiB/s | 11.0 KiB | 00m00s [103/303] Installing perl-overload-0:1. 100% | 70.3 MiB/s | 72.0 KiB | 00m00s [104/303] Installing perl-Storable-1:3. 100% | 113.7 MiB/s | 232.8 KiB | 00m00s [105/303] Installing perl-constant-0:1. 100% | 26.7 MiB/s | 27.4 KiB | 00m00s [106/303] Installing perl-MIME-Base64-0 100% | 21.6 MiB/s | 44.3 KiB | 00m00s [107/303] Installing perl-Errno-0:1.38- 100% | 8.6 MiB/s | 8.8 KiB | 00m00s [108/303] Installing perl-File-Basename 100% | 14.3 MiB/s | 14.6 KiB | 00m00s [109/303] Installing perl-Scalar-List-U 100% | 48.3 MiB/s | 148.5 KiB | 00m00s [110/303] Installing perl-Getopt-Std-0: 100% | 11.5 MiB/s | 11.8 KiB | 00m00s [111/303] Installing perl-Encode-4:3.21 100% | 126.9 MiB/s | 4.7 MiB | 00m00s [112/303] Installing perl-DynaLoader-0: 100% | 31.7 MiB/s | 32.5 KiB | 00m00s [113/303] Installing perl-PathTools-0:3 100% | 60.1 MiB/s | 184.6 KiB | 00m00s [114/303] Installing perl-Exporter-0:5. 100% | 54.3 MiB/s | 55.6 KiB | 00m00s [115/303] Installing perl-Carp-0:1.54-5 100% | 15.5 MiB/s | 47.7 KiB | 00m00s [116/303] Installing perl-libs-4:5.42.0 100% | 155.3 MiB/s | 11.6 MiB | 00m00s [117/303] Installing perl-interpreter-4 100% | 7.8 MiB/s | 120.3 KiB | 00m00s [118/303] Installing perl-File-Find-0:1 100% | 41.5 MiB/s | 42.5 KiB | 00m00s [119/303] Installing perl-version-9:0.9 100% | 64.2 MiB/s | 131.5 KiB | 00m00s [120/303] Installing perl-File-Copy-0:2 100% | 19.7 MiB/s | 20.2 KiB | 00m00s [121/303] Installing perl-ExtUtils-Mani 100% | 84.3 MiB/s | 86.3 KiB | 00m00s [122/303] Installing perl-lib-0:0.65-51 100% | 8.7 MiB/s | 8.9 KiB | 00m00s [123/303] Installing perl-threads-1:2.4 100% | 57.2 MiB/s | 117.1 KiB | 00m00s [124/303] Installing perl-threads-share 100% | 41.9 MiB/s | 85.9 KiB | 00m00s [125/303] Installing perl-Compress-Raw- 100% | 80.8 MiB/s | 165.5 KiB | 00m00s [126/303] Installing perl-File-Compare- 100% | 6.0 MiB/s | 6.2 KiB | 00m00s [127/303] Installing perl-Time-HiRes-4: 100% | 57.5 MiB/s | 117.8 KiB | 00m00s [128/303] Installing perl-CPAN-Meta-Req 100% | 40.7 MiB/s | 83.4 KiB | 00m00s [129/303] Installing perl-Module-CoreLi 100% | 308.7 MiB/s | 1.2 MiB | 00m00s [130/303] Installing perl-Module-Metada 100% | 67.4 MiB/s | 69.0 KiB | 00m00s [131/303] Installing perl-Digest-SHA-1: 100% | 7.0 MiB/s | 115.0 KiB | 00m00s [132/303] Installing perl-Filter-2:1.64 100% | 32.5 MiB/s | 166.2 KiB | 00m00s [133/303] Installing perl-Module-Load-1 100% | 15.5 MiB/s | 15.9 KiB | 00m00s [134/303] Installing perl-Perl-OSType-0 100% | 33.5 MiB/s | 34.3 KiB | 00m00s [135/303] Installing perl-Term-ReadLine 100% | 17.4 MiB/s | 17.9 KiB | 00m00s [136/303] Installing perl-Tie-0:4.6-519 100% | 33.1 MiB/s | 33.9 KiB | 00m00s [137/303] Installing perl-Unicode-Norma 100% | 159.0 MiB/s | 488.4 KiB | 00m00s [138/303] Installing perl-meta-notation 100% | 0.0 B/s | 2.3 KiB | 00m00s [139/303] Installing perl-encoding-4:3. 100% | 146.9 MiB/s | 150.4 KiB | 00m00s [140/303] Installing perl-Net-Ping-0:2. 100% | 66.1 MiB/s | 135.3 KiB | 00m00s [141/303] Installing perl-ExtUtils-Comm 100% | 9.9 MiB/s | 10.2 KiB | 00m00s [142/303] Installing perl-Pod-Html-0:1. 100% | 2.9 MiB/s | 43.9 KiB | 00m00s [143/303] Installing perl-File-Which-0: 100% | 30.7 MiB/s | 31.4 KiB | 00m00s [144/303] Installing perl-AutoSplit-0:5 100% | 23.0 MiB/s | 23.6 KiB | 00m00s [145/303] Installing perl-Benchmark-0:1 100% | 36.0 MiB/s | 36.8 KiB | 00m00s [146/303] Installing perl-Test-Harness- 100% | 23.7 MiB/s | 583.6 KiB | 00m00s [147/303] Installing perl-CPAN-Meta-YAM 100% | 52.3 MiB/s | 53.5 KiB | 00m00s [148/303] Installing perl-Compress-Raw- 100% | 34.0 MiB/s | 69.6 KiB | 00m00s [149/303] Installing perl-IO-Compress-0 100% | 49.1 MiB/s | 1.0 MiB | 00m00s [150/303] Installing perl-IO-Zlib-1:1.1 100% | 2.9 MiB/s | 26.7 KiB | 00m00s [151/303] Installing perl-Devel-PPPort- 100% | 217.8 MiB/s | 892.1 KiB | 00m00s [152/303] Installing perl-DirHandle-0:1 100% | 0.0 B/s | 3.8 KiB | 00m00s [153/303] Installing perl-Dumpvalue-0:2 100% | 19.7 MiB/s | 20.2 KiB | 00m00s [154/303] Installing perl-ExtUtils-Cons 100% | 85.7 MiB/s | 87.7 KiB | 00m00s [155/303] Installing perl-ExtUtils-MM-U 100% | 3.6 MiB/s | 3.7 KiB | 00m00s [156/303] Installing perl-Hash-Util-Fie 100% | 31.4 MiB/s | 64.3 KiB | 00m00s [157/303] Installing perl-Hash-Util-0:0 100% | 55.1 MiB/s | 56.4 KiB | 00m00s [158/303] Installing perl-fields-0:2.27 100% | 12.0 MiB/s | 12.3 KiB | 00m00s [159/303] Installing perl-ExtUtils-Pars 100% | 28.0 MiB/s | 545.5 KiB | 00m00s [160/303] Installing perl-ExtUtils-Make 100% | 38.6 MiB/s | 750.3 KiB | 00m00s [161/303] Installing perl-ExtUtils-Inst 100% | 85.1 MiB/s | 87.2 KiB | 00m00s [162/303] Installing perl-devel-4:5.42. 100% | 136.0 MiB/s | 3.8 MiB | 00m00s [163/303] Installing perl-ExtUtils-Embe 100% | 15.7 MiB/s | 16.1 KiB | 00m00s [164/303] Installing perl-I18N-LangTags 100% | 81.8 MiB/s | 83.8 KiB | 00m00s [165/303] Installing perl-Locale-Makete 100% | 84.9 MiB/s | 173.9 KiB | 00m00s [166/303] Installing perl-Locale-Makete 100% | 13.2 MiB/s | 13.5 KiB | 00m00s [167/303] Installing perl-Params-Check- 100% | 27.9 MiB/s | 28.6 KiB | 00m00s [168/303] Installing perl-Module-Load-C 100% | 29.2 MiB/s | 29.9 KiB | 00m00s [169/303] Installing perl-IPC-Cmd-2:1.0 100% | 83.9 MiB/s | 85.9 KiB | 00m00s [170/303] Installing perl-Math-Complex- 100% | 84.0 MiB/s | 86.0 KiB | 00m00s [171/303] Installing perl-Math-BigInt-1 100% | 212.8 MiB/s | 1.1 MiB | 00m00s [172/303] Installing perl-JSON-PP-1:4.1 100% | 8.8 MiB/s | 143.6 KiB | 00m00s [173/303] Installing perl-CPAN-Meta-0:2 100% | 66.6 MiB/s | 613.8 KiB | 00m00s [174/303] Installing perl-NDBM_File-0:1 100% | 28.9 MiB/s | 29.6 KiB | 00m00s [175/303] Installing perl-SelfLoader-0: 100% | 22.1 MiB/s | 22.6 KiB | 00m00s [176/303] Installing perl-Sys-Hostname- 100% | 16.8 MiB/s | 17.2 KiB | 00m00s [177/303] Installing perl-Term-Table-0: 100% | 39.6 MiB/s | 81.0 KiB | 00m00s [178/303] Installing perl-Text-Balanced 100% | 110.1 MiB/s | 112.7 KiB | 00m00s [179/303] Installing perl-Tie-RefHash-0 100% | 36.5 MiB/s | 37.4 KiB | 00m00s [180/303] Installing perl-User-pwent-0: 100% | 17.5 MiB/s | 17.9 KiB | 00m00s [181/303] Installing perl-autouse-0:1.1 100% | 0.0 B/s | 6.4 KiB | 00m00s [182/303] Installing perl-subs-0:1.04-5 100% | 0.0 B/s | 2.5 KiB | 00m00s [183/303] Installing perl-Opcode-0:1.69 100% | 48.7 MiB/s | 49.8 KiB | 00m00s [184/303] Installing perl-Safe-0:2.47-5 100% | 30.3 MiB/s | 31.1 KiB | 00m00s [185/303] Installing perl-Params-Util-0 100% | 29.8 MiB/s | 61.0 KiB | 00m00s [186/303] Installing perl-Sub-Install-0 100% | 36.3 MiB/s | 37.2 KiB | 00m00s [187/303] Installing perl-Data-OptList- 100% | 51.0 MiB/s | 52.2 KiB | 00m00s [188/303] Installing perl-Filter-Simple 100% | 25.3 MiB/s | 51.7 KiB | 00m00s [189/303] Installing perl-Test-Simple-3 100% | 68.1 MiB/s | 1.8 MiB | 00m00s [190/303] Installing perl-Devel-SelfStu 100% | 7.2 MiB/s | 7.3 KiB | 00m00s [191/303] Installing perl-Memoize-0:1.1 100% | 65.2 MiB/s | 66.8 KiB | 00m00s [192/303] Installing perl-Math-BigInt-F 100% | 22.9 MiB/s | 46.9 KiB | 00m00s [193/303] Installing perl-bignum-0:0.67 100% | 66.6 MiB/s | 136.5 KiB | 00m00s [194/303] Installing perl-File-Fetch-0: 100% | 59.9 MiB/s | 61.3 KiB | 00m00s [195/303] Installing perl-ExtUtils-Mini 100% | 8.6 MiB/s | 8.8 KiB | 00m00s [196/303] Installing perl-inc-latest-2: 100% | 35.5 MiB/s | 36.3 KiB | 00m00s [197/303] Installing perl-libnetcfg-4:5 100% | 1.2 MiB/s | 17.3 KiB | 00m00s [198/303] Installing perl-DBM_Filter-0: 100% | 30.0 MiB/s | 30.7 KiB | 00m00s [199/303] Installing perl-File-HomeDir- 100% | 60.5 MiB/s | 123.8 KiB | 00m00s [200/303] Installing perl-open-0:1.13-5 100% | 0.0 B/s | 11.7 KiB | 00m00s [201/303] Installing perl-debugger-0:1. 100% | 197.4 MiB/s | 404.3 KiB | 00m00s [202/303] Installing perl-sigtrap-0:1.1 100% | 11.2 MiB/s | 11.5 KiB | 00m00s [203/303] Installing perl-Unicode-Colla 100% | 233.1 MiB/s | 4.2 MiB | 00m00s [204/303] Installing perl-Unicode-UCD-0 100% | 202.1 MiB/s | 206.9 KiB | 00m00s [205/303] Installing perl-Env-0:1.06-51 100% | 26.6 MiB/s | 27.2 KiB | 00m00s [206/303] Installing perl-Module-CoreLi 100% | 1.3 MiB/s | 19.3 KiB | 00m00s [207/303] Installing perl-Archive-Zip-0 100% | 17.1 MiB/s | 297.8 KiB | 00m00s [208/303] Installing perl-Thread-0:3.06 100% | 12.2 MiB/s | 12.5 KiB | 00m00s [209/303] Installing perl-Thread-Queue- 100% | 29.7 MiB/s | 30.4 KiB | 00m00s [210/303] Installing perl-Thread-Semaph 100% | 10.4 MiB/s | 10.6 KiB | 00m00s [211/303] Installing perl-experimental- 100% | 43.8 MiB/s | 44.8 KiB | 00m00s [212/303] Installing perl-Encode-devel- 100% | 5.5 MiB/s | 101.1 KiB | 00m00s [213/303] Installing perl-Pod-Checker-4 100% | 3.7 MiB/s | 53.5 KiB | 00m00s [214/303] Installing perl-diagnostics-0 100% | 30.7 MiB/s | 472.1 KiB | 00m00s [215/303] Installing perl-macros-4:5.42 100% | 0.0 B/s | 5.8 KiB | 00m00s [216/303] Installing perl-utils-0:5.42. 100% | 6.9 MiB/s | 98.6 KiB | 00m00s [217/303] Installing perl-Attribute-Han 100% | 39.6 MiB/s | 40.5 KiB | 00m00s [218/303] Installing perl-Config-Extens 100% | 3.2 MiB/s | 3.2 KiB | 00m00s [219/303] Installing perl-Config-Perl-V 100% | 26.9 MiB/s | 27.5 KiB | 00m00s [220/303] Installing perl-Devel-Peek-0: 100% | 43.8 MiB/s | 44.9 KiB | 00m00s [221/303] Installing perl-English-0:1.1 100% | 0.0 B/s | 6.7 KiB | 00m00s [222/303] Installing perl-File-DosGlob- 100% | 21.7 MiB/s | 22.2 KiB | 00m00s [223/303] Installing perl-FileCache-0:1 100% | 0.0 B/s | 7.9 KiB | 00m00s [224/303] Installing perl-FindBin-0:1.5 100% | 7.0 MiB/s | 7.2 KiB | 00m00s [225/303] Installing perl-GDBM_File-1:1 100% | 78.9 MiB/s | 80.8 KiB | 00m00s [226/303] Installing perl-I18N-Collate- 100% | 7.5 MiB/s | 7.6 KiB | 00m00s [227/303] Installing perl-I18N-Langinfo 100% | 35.3 MiB/s | 36.2 KiB | 00m00s [228/303] Installing perl-IPC-SysV-0:2. 100% | 37.4 MiB/s | 76.7 KiB | 00m00s [229/303] Installing perl-Module-Loaded 100% | 5.4 MiB/s | 5.6 KiB | 00m00s [230/303] Installing perl-NEXT-0:0.69-5 100% | 23.4 MiB/s | 24.0 KiB | 00m00s [231/303] Installing perl-Net-0:1.04-51 100% | 23.3 MiB/s | 23.9 KiB | 00m00s [232/303] Installing perl-ODBM_File-0:1 100% | 29.0 MiB/s | 29.7 KiB | 00m00s [233/303] Installing perl-PerlIO-via-Qu 100% | 31.4 MiB/s | 32.1 KiB | 00m00s [234/303] Installing perl-Pod-Functions 100% | 0.0 B/s | 14.8 KiB | 00m00s [235/303] Installing perl-Search-Dict-0 100% | 5.1 MiB/s | 5.2 KiB | 00m00s [236/303] Installing perl-Sys-Syslog-0: 100% | 47.3 MiB/s | 96.9 KiB | 00m00s [237/303] Installing perl-Term-Complete 100% | 6.2 MiB/s | 6.3 KiB | 00m00s [238/303] Installing perl-Test-0:1.31-5 100% | 36.5 MiB/s | 37.4 KiB | 00m00s [239/303] Installing perl-Text-Abbrev-0 100% | 3.5 MiB/s | 3.6 KiB | 00m00s [240/303] Installing perl-Tie-File-0:1. 100% | 84.1 MiB/s | 86.2 KiB | 00m00s [241/303] Installing perl-Tie-Memoize-0 100% | 6.6 MiB/s | 6.8 KiB | 00m00s [242/303] Installing perl-Time-0:1.04-5 100% | 10.7 MiB/s | 10.9 KiB | 00m00s [243/303] Installing perl-Time-Piece-0: 100% | 35.6 MiB/s | 72.9 KiB | 00m00s [244/303] Installing perl-blib-0:1.07-5 100% | 0.0 B/s | 3.6 KiB | 00m00s [245/303] Installing perl-deprecate-0:0 100% | 6.8 MiB/s | 7.0 KiB | 00m00s [246/303] Installing perl-doc-0:5.42.0- 100% | 250.3 MiB/s | 11.5 MiB | 00m00s [247/303] Installing perl-encoding-warn 100% | 10.4 MiB/s | 10.7 KiB | 00m00s [248/303] Installing perl-filetest-0:1. 100% | 6.7 MiB/s | 6.8 KiB | 00m00s [249/303] Installing perl-less-0:0.03-5 100% | 5.2 MiB/s | 5.3 KiB | 00m00s [250/303] Installing perl-perlfaq-0:5.2 100% | 180.1 MiB/s | 737.9 KiB | 00m00s [251/303] Installing perl-ph-0:5.42.0-5 100% | 91.7 MiB/s | 281.8 KiB | 00m00s [252/303] Installing perl-sort-0:2.06-5 100% | 5.1 MiB/s | 5.2 KiB | 00m00s [253/303] Installing perl-vmsish-0:1.04 100% | 0.0 B/s | 7.0 KiB | 00m00s [254/303] Installing perl-Compress-Bzip 100% | 70.9 MiB/s | 145.3 KiB | 00m00s [255/303] Installing perl-Devel-Size-0: 100% | 42.8 MiB/s | 43.8 KiB | 00m00s [256/303] Installing perl-Text-Glob-0:0 100% | 9.1 MiB/s | 9.3 KiB | 00m00s [257/303] Installing perl-local-lib-0:2 100% | 58.8 MiB/s | 120.4 KiB | 00m00s [258/303] Installing perl-IPC-System-Si 100% | 35.9 MiB/s | 73.5 KiB | 00m00s [259/303] Installing perl-autodie-0:2.3 100% | 71.3 MiB/s | 219.1 KiB | 00m00s [260/303] Installing perl-Compress-Raw- 100% | 60.2 MiB/s | 123.3 KiB | 00m00s [261/303] Installing perl-IO-Compress-L 100% | 71.7 MiB/s | 220.4 KiB | 00m00s [262/303] Installing perl-Algorithm-Dif 100% | 106.9 MiB/s | 109.5 KiB | 00m00s [263/303] Installing perl-Text-Diff-0:1 100% | 83.1 MiB/s | 85.1 KiB | 00m00s [264/303] Installing perl-Archive-Tar-0 100% | 10.2 MiB/s | 156.9 KiB | 00m00s [265/303] Installing perl-Module-Signat 100% | 9.0 MiB/s | 138.8 KiB | 00m00s [266/303] Installing perl-Text-Template 100% | 111.3 MiB/s | 114.0 KiB | 00m00s [267/303] Installing perl-MRO-Compat-0: 100% | 43.8 MiB/s | 44.9 KiB | 00m00s [268/303] Installing perl-Package-Gener 100% | 30.8 MiB/s | 31.5 KiB | 00m00s [269/303] Installing perl-Sub-Exporter- 100% | 65.7 MiB/s | 201.9 KiB | 00m00s [270/303] Installing perl-Data-Section- 100% | 43.0 MiB/s | 44.1 KiB | 00m00s [271/303] Installing perl-Software-Lice 100% | 100.2 MiB/s | 513.1 KiB | 00m00s [272/303] Installing perl-Module-Build- 100% | 34.1 MiB/s | 663.2 KiB | 00m00s [273/303] Installing perl-TermReadKey-0 100% | 32.3 MiB/s | 66.2 KiB | 00m00s [274/303] Installing perl-Error-1:0.170 100% | 39.0 MiB/s | 80.0 KiB | 00m00s [275/303] Installing git-0:2.50.1-1.fc4 100% | 85.2 MiB/s | 87.2 KiB | 00m00s [276/303] Installing perl-Git-0:2.50.1- 100% | 63.5 MiB/s | 65.0 KiB | 00m00s [277/303] Installing rocm-clang-0:19-12 100% | 67.5 MiB/s | 70.2 MiB | 00m01s [278/303] Installing rocm-clang-devel-0 100% | 90.9 MiB/s | 23.5 MiB | 00m00s [279/303] Installing rocm-device-libs-0 100% | 76.5 MiB/s | 3.2 MiB | 00m00s [280/303] Installing rocm-comgr-devel-0 100% | 48.6 MiB/s | 99.6 KiB | 00m00s [281/303] Installing hipcc-0:19-12.rocm 100% | 27.8 MiB/s | 654.3 KiB | 00m00s [282/303] Installing rocm-hip-0:6.4.2-1 100% | 265.4 MiB/s | 24.9 MiB | 00m00s [283/303] Installing libdb-0:5.3.28-65. 100% | 231.8 MiB/s | 1.9 MiB | 00m00s [284/303] Installing perl-DB_File-0:1.8 100% | 93.1 MiB/s | 190.6 KiB | 00m00s [285/303] Installing emacs-filesystem-1 100% | 265.6 KiB/s | 544.0 B | 00m00s [286/303] Installing libstdc++-devel-0: 100% | 195.4 MiB/s | 16.2 MiB | 00m00s [287/303] Installing gcc-c++-0:15.1.1-3 100% | 275.6 MiB/s | 41.3 MiB | 00m00s [288/303] Installing perl-ExtUtils-CBui 100% | 33.2 MiB/s | 102.1 KiB | 00m00s [289/303] Installing perl-CPAN-0:2.38-5 100% | 79.0 MiB/s | 1.9 MiB | 00m00s [290/303] Installing perl-4:5.42.0-519. 100% | 121.1 KiB/s | 124.0 B | 00m00s [291/303] Installing rhash-0:1.4.5-2.fc 100% | 21.8 MiB/s | 356.4 KiB | 00m00s [292/303] Installing libuv-1:1.51.0-1.f 100% | 139.9 MiB/s | 573.0 KiB | 00m00s [293/303] Installing jsoncpp-0:1.9.6-1. 100% | 128.5 MiB/s | 263.1 KiB | 00m00s [294/303] Installing cmake-0:3.31.6-3.f 100% | 246.5 MiB/s | 34.5 MiB | 00m00s [295/303] Installing cmake-data-0:3.31. 100% | 52.7 MiB/s | 9.1 MiB | 00m00s [296/303] Installing rocm-cmake-0:6.4.0 100% | 66.2 MiB/s | 135.6 KiB | 00m00s [297/303] Installing hipify-0:6.4.1-2.f 100% | 134.2 MiB/s | 3.1 MiB | 00m00s [298/303] Installing rocm-hip-devel-0:6 100% | 115.5 MiB/s | 2.8 MiB | 00m00s [299/303] Installing rocm-rpm-macros-0: 100% | 19.0 MiB/s | 19.5 KiB | 00m00s [300/303] Installing rocm-smi-devel-0:6 100% | 138.7 MiB/s | 284.0 KiB | 00m00s [301/303] Installing rocm-core-devel-0: 100% | 15.8 MiB/s | 16.1 KiB | 00m00s [302/303] Installing annobin-plugin-gcc 100% | 32.9 MiB/s | 1.0 MiB | 00m00s [303/303] Installing gcc-plugin-annobin 100% | 207.2 KiB/s | 58.6 KiB | 00m00s Warning: skipped OpenPGP checks for 31 packages from repository: copr_base Complete! Finish: build setup for rccl-6.4.2-1.fc43.src.rpm Start: rpmbuild rccl-6.4.2-1.fc43.src.rpm Building target platforms: x86_64 Building for target x86_64 setting SOURCE_DATE_EPOCH=1753142400 Executing(%mkbuilddir): /bin/sh -e /var/tmp/rpm-tmp.JSsvw2 Executing(%prep): /bin/sh -e /var/tmp/rpm-tmp.WymhLA + umask 022 + cd /builddir/build/BUILD/rccl-6.4.2-build + cd /builddir/build/BUILD/rccl-6.4.2-build + rm -rf rccl-rocm-6.4.2 + /usr/lib/rpm/rpmuncompress -x /builddir/build/SOURCES/RCCL-6.4.2.tar.gz + STATUS=0 + '[' 0 -ne 0 ']' + cd rccl-rocm-6.4.2 + /usr/bin/chmod -Rf a+rX,u+w,g-w,o-w . + sed -i -e '/AMD GPU targets to compile for/d' CMakeLists.txt + sed -i -e 's@cat ${ROCM_PATH}/.info/version@echo 6.4.2@' CMakeLists.txt + sed -i -e s@rocm-core/rocm_version.h@rocm_version.h@ src/include/hip_rocm_version_info.h + sed -i -e 's@if (ENABLE_MSCCLPP AND NOT(${HOST_OS_ID} STREQUAL "ubuntu" OR ${HOST_OS_ID} STREQUAL "centos"))@if (ENABLE_MSCCLPP)@' CMakeLists.txt + sed -i '/#include ' test/common/TestBed.hpp + RPM_EC=0 ++ jobs -p + exit 0 Executing(%build): /bin/sh -e /var/tmp/rpm-tmp.vCjhzZ + umask 022 + cd /builddir/build/BUILD/rccl-6.4.2-build + CFLAGS='-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer ' + export CFLAGS + CXXFLAGS='-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer' + export CXXFLAGS + FFLAGS='-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -I/usr/lib64/gfortran/modules ' + export FFLAGS + FCFLAGS='-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -I/usr/lib64/gfortran/modules ' + export FCFLAGS + VALAFLAGS=-g + export VALAFLAGS + RUSTFLAGS='-Copt-level=3 -Cdebuginfo=2 -Ccodegen-units=1 -Cstrip=none -Cforce-frame-pointers=yes -Clink-arg=-specs=/usr/lib/rpm/redhat/redhat-package-notes --cap-lints=warn' + export RUSTFLAGS + LDFLAGS='-Wl,-z,relro -Wl,--as-needed -Wl,-z,pack-relative-relocs -Wl,-z,now -Wl,-z,now -Wl,--build-id=sha1 -specs=/usr/lib/rpm/redhat/redhat-package-notes ' + export LDFLAGS + LT_SYS_LIBRARY_PATH=/usr/lib64: + export LT_SYS_LIBRARY_PATH + CC=hipcc + export CC + CXX=hipcc + export CXX + cd rccl-rocm-6.4.2 + CFLAGS='-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer ' + export CFLAGS + CXXFLAGS='-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer' + export CXXFLAGS + FFLAGS='-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -I/usr/lib64/gfortran/modules ' + export FFLAGS + FCFLAGS='-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -I/usr/lib64/gfortran/modules ' + export FCFLAGS + VALAFLAGS=-g + export VALAFLAGS + RUSTFLAGS='-Copt-level=3 -Cdebuginfo=2 -Ccodegen-units=1 -Cstrip=none -Cforce-frame-pointers=yes -Clink-arg=-specs=/usr/lib/rpm/redhat/redhat-package-notes --cap-lints=warn' + export RUSTFLAGS + LDFLAGS='-Wl,-z,relro -Wl,--as-needed -Wl,-z,pack-relative-relocs -Wl,-z,now -Wl,-z,now -Wl,--build-id=sha1 -specs=/usr/lib/rpm/redhat/redhat-package-notes ' + export LDFLAGS + LT_SYS_LIBRARY_PATH=/usr/lib64: + export LT_SYS_LIBRARY_PATH + CC=hipcc + export CC + CXX=hipcc + export CXX + /usr/bin/cmake -S . -B redhat-linux-build -DCMAKE_C_FLAGS_RELEASE:STRING=-DNDEBUG -DCMAKE_CXX_FLAGS_RELEASE:STRING=-DNDEBUG -DCMAKE_Fortran_FLAGS_RELEASE:STRING=-DNDEBUG -DCMAKE_VERBOSE_MAKEFILE:BOOL=ON -DCMAKE_INSTALL_DO_STRIP:BOOL=OFF -DCMAKE_INSTALL_PREFIX:PATH=/usr -DCMAKE_INSTALL_FULL_SBINDIR:PATH=/usr/bin -DCMAKE_INSTALL_SBINDIR:PATH=bin -DINCLUDE_INSTALL_DIR:PATH=/usr/include -DLIB_INSTALL_DIR:PATH=/usr/lib64 -DSYSCONF_INSTALL_DIR:PATH=/etc -DSHARE_INSTALL_PREFIX:PATH=/usr/share -DLIB_SUFFIX=64 -DBUILD_SHARED_LIBS:BOOL=ON '-DAMDGPU_TARGETS=gfx90a:xnack+;gfx90a:xnack-;gfx1100;gfx1101;gfx1102;gfx1200;gfx1201' -DBUILD_FILE_REORG_BACKWARD_COMPATIBILITY=OFF -DBUILD_TESTS=OFF -DCMAKE_BUILD_TYPE=RelWithDebInfo -DCMAKE_C_COMPILER=/usr/bin/hipcc -DCMAKE_CXX_COMPILER=/usr/bin/hipcc -DCMAKE_EXPORT_COMPILE_COMMANDS=OFF -DCMAKE_INSTALL_LIBDIR=/usr/lib64 -DCMAKE_SKIP_RPATH=ON -DENABLE_MSCCLPP=OFF -DHIP_PLATFORM=amd -DRCCL_ROCPROFILER_REGISTER=OFF -DROCM_PATH=/usr -DROCM_SYMLINK_LIBS=OFF CMake Deprecation Warning at CMakeLists.txt:6 (cmake_minimum_required): Compatibility with CMake < 3.10 will be removed from a future version of CMake. Update the VERSION argument value. Or, use the ... syntax to tell CMake that the project requires at least but has been updated to work with policies introduced by or earlier. -- CMAKE_TOOLCHAIN_FILE: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/toolchain-linux.cmake -- The CXX compiler identification is Clang 19.0.0 -- Detecting CXX compiler ABI info -- Detecting CXX compiler ABI info - done -- Check for working CXX compiler: /usr/bin/hipcc - skipped -- Detecting CXX compile features -- Detecting CXX compile features - done -- Could NOT find GTest (missing: GTEST_LIBRARY GTEST_INCLUDE_DIR GTEST_MAIN_LIBRARY) (Required is at least version "1.11") CMake Deprecation Warning at /usr/share/rocm/cmake/ROCMConfig.cmake:12 (message): Use of find_package(ROCM) is deprecated as of ROCm 6.4. Please use find_package(ROCmCMakeBuildTools) Call Stack (most recent call first): cmake/Dependencies.cmake:75 (find_package) CMakeLists.txt:55 (include) -- Checking for ROCm support for GPU targets: gfx906;gfx908;gfx90a;gfx942;gfx1030;gfx1100;gfx1101;gfx1102;gfx1200;gfx1201 -- Performing Test COMPILER_HAS_TARGET_ID_gfx906 -- Performing Test COMPILER_HAS_TARGET_ID_gfx906 - Success -- Performing Test COMPILER_HAS_TARGET_ID_gfx908 -- Performing Test COMPILER_HAS_TARGET_ID_gfx908 - Success -- Performing Test COMPILER_HAS_TARGET_ID_gfx90a -- Performing Test COMPILER_HAS_TARGET_ID_gfx90a - Success -- Performing Test COMPILER_HAS_TARGET_ID_gfx942 -- Performing Test COMPILER_HAS_TARGET_ID_gfx942 - Success -- Performing Test COMPILER_HAS_TARGET_ID_gfx1030 -- Performing Test COMPILER_HAS_TARGET_ID_gfx1030 - Success -- Performing Test COMPILER_HAS_TARGET_ID_gfx1100 -- Performing Test COMPILER_HAS_TARGET_ID_gfx1100 - Success -- Performing Test COMPILER_HAS_TARGET_ID_gfx1101 -- Performing Test COMPILER_HAS_TARGET_ID_gfx1101 - Success -- Performing Test COMPILER_HAS_TARGET_ID_gfx1102 -- Performing Test COMPILER_HAS_TARGET_ID_gfx1102 - Success -- Performing Test COMPILER_HAS_TARGET_ID_gfx1200 -- Performing Test COMPILER_HAS_TARGET_ID_gfx1200 - Success -- Performing Test COMPILER_HAS_TARGET_ID_gfx1201 -- Performing Test COMPILER_HAS_TARGET_ID_gfx1201 - Success -- Compiling for gfx906;gfx908;gfx90a;gfx942;gfx1030;gfx1100;gfx1101;gfx1102;gfx1200;gfx1201 -- Could NOT find GTest (missing: GTEST_LIBRARY GTEST_INCLUDE_DIR GTEST_MAIN_LIBRARY) (Required is at least version "1.11") CMake Deprecation Warning at /usr/share/rocm/cmake/ROCMConfig.cmake:12 (message): Use of find_package(ROCM) is deprecated as of ROCm 6.4. Please use find_package(ROCmCMakeBuildTools) Call Stack (most recent call first): cmake/Dependencies.cmake:75 (find_package) CMakeLists.txt:102 (include) -- ROCM_PATH found: /usr -- Compiling with hipcc -- Performing Test CMAKE_HAVE_LIBC_PTHREAD -- Performing Test CMAKE_HAVE_LIBC_PTHREAD - Success -- Found Threads: TRUE -- Performing Test HIP_CLANG_SUPPORTS_PARALLEL_JOBS -- Performing Test HIP_CLANG_SUPPORTS_PARALLEL_JOBS - Success -- HIP compiler: clang -- HIP runtime: rocclr -- hipcc executable: /usr/bin/hipcc sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory -- hipcc version: 6.4.43484 -- hipconfig executable: /usr/bin/hipconfig -- hipcc HIP version: 6.4.43484 -- ROCm version: 6.4.2 -- Looking for hipDeviceMallocUncached -- Looking for hipDeviceMallocUncached - found -- Looking for hipDeviceMallocContiguous -- Looking for hipDeviceMallocContiguous - found -- RCCL LL128 protocol enabled -- HSA runtime: /usr/include -- Found rocm_smi at /usr/include -- Looking for C++ include /usr/include/rocm_smi/rocm_smi64Config.h -- Looking for C++ include /usr/include/rocm_smi/rocm_smi64Config.h - found -- RSMI_INIT_FLAG_THRAD_ONLY_MUTEX supported -- Performing Test HAVE_KERNARG_PRELOAD -- Performing Test HAVE_KERNARG_PRELOAD - Success -- Kernarg preloading to SGPR enabled -- Performing Test HAVE_PARALLEL_JOBS -- Performing Test HAVE_PARALLEL_JOBS - Success -- Parallel jobs enabled CMake Warning at CMakeLists.txt:331 (message): ROCTX library not found. Skipping ROCTX linking. -- Found Python3: /usr/bin/python3.14 (found version "3.14.0") found components: Interpreter -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/device_table.h -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/device_table.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/host_table.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp -- HIP_CONTIGUOUS_MEMORY enabled -- HIP_UNCACHED_MEMORY enabled -- Use 1 jobs for linking -- Building shared RCCL library -- rocm-cmake: Set license file to /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/LICENSE.txt. -- Configuring done (46.4s) -- Generating done (0.1s) CMake Warning: Manually-specified variables were not used by the project: AMDGPU_TARGETS CMAKE_CXX_FLAGS_RELEASE CMAKE_C_FLAGS_RELEASE CMAKE_Fortran_FLAGS_RELEASE CMAKE_INSTALL_DO_STRIP LIB_SUFFIX SHARE_INSTALL_PREFIX SYSCONF_INSTALL_DIR -- Build files have been written to: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build + /usr/bin/cmake --build redhat-linux-build -j2 --verbose Change Dir: '/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build' Run Build Command(s): /usr/bin/cmake -E env VERBOSE=1 /usr/bin/gmake -f Makefile -j2 /usr/bin/cmake -S/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2 -B/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build --check-build-system CMakeFiles/Makefile.cmake 0 /usr/bin/cmake -E cmake_progress_start /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/CMakeFiles /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build//CMakeFiles/progress.marks /usr/bin/gmake -f CMakeFiles/Makefile2 all gmake[1]: Entering directory '/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build' /usr/bin/gmake -f CMakeFiles/git_version_check.dir/build.make CMakeFiles/git_version_check.dir/depend gmake[2]: Entering directory '/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build' cd /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2 /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2 /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/CMakeFiles/git_version_check.dir/DependInfo.cmake "--color=" gmake[2]: Leaving directory '/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build' /usr/bin/gmake -f CMakeFiles/git_version_check.dir/build.make CMakeFiles/git_version_check.dir/build gmake[2]: Entering directory '/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build' [ 0%] Updating git_version.cpp if necessary /usr/bin/cmake -P /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/git_version.cmake -- Updating git_version.cpp gmake[2]: Leaving directory '/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build' [ 0%] Built target git_version_check /usr/bin/gmake -f CMakeFiles/rccl.dir/build.make CMakeFiles/rccl.dir/depend gmake[2]: Entering directory '/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build' [ 0%] Hipifying src/transport/shm.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/shm.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/transport/shm.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/shm.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/shm.cc [ 0%] Hipifying src/bootstrap.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/bootstrap.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/bootstrap.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/bootstrap.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/bootstrap.cc [ 0%] Hipifying src/channel.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/channel.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc [ 0%] Hipifying src/collectives.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/collectives.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc [ 1%] Hipifying src/debug.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/debug.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/debug.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/debug.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/debug.cc [ 1%] Hipifying src/device/all_gather.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/device/all_gather.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h [ 2%] Hipifying src/device/all_reduce.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/device/all_reduce.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h [ 2%] Hipifying src/device/alltoall_pivot.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/device/alltoall_pivot.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h [ 2%] Hipifying src/device/broadcast.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/device/broadcast.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h [ 2%] Hipifying src/device/common.cu -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.cu.cpp mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/device/common.cu -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.cu.cpp && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.cu.cpp Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h [ 2%] Hipifying src/device/common.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/device/common.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h [ 3%] Hipifying src/device/common_kernel.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common_kernel.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/device/common_kernel.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common_kernel.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common_kernel.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h [ 4%] Hipifying src/device/msccl_kernel_impl.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/device/msccl_kernel_impl.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common_kernel.h [ 4%] Hipifying src/device/network/unpack/unpack.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack/unpack.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/device/network/unpack/unpack.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack/unpack.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack/unpack.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack/unpack.h [ 5%] Hipifying src/device/network/unpack/unpack_defs.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack/unpack_defs.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/device/network/unpack/unpack_defs.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack/unpack_defs.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack/unpack_defs.h [ 5%] Hipifying src/device/onerank.cu -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/onerank.cu.cpp mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/device/onerank.cu -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/onerank.cu.cpp && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/onerank.cu.cpp Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack/unpack_defs.h [ 5%] Hipifying src/device/op128.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/op128.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/device/op128.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/op128.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/op128.h [ 5%] Hipifying src/device/primitives.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/device/primitives.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/op128.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h [ 6%] Hipifying src/device/prims_ll.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/device/prims_ll.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h [ 6%] Hipifying src/device/prims_ll128.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/device/prims_ll128.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h [ 6%] Hipifying src/device/prims_simple.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/device/prims_simple.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h [ 6%] Hipifying src/device/reduce.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/device/reduce.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h [ 6%] Hipifying src/device/reduce_kernel.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_kernel.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/device/reduce_kernel.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_kernel.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_kernel.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h [ 7%] Hipifying src/device/reduce_scatter.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/device/reduce_scatter.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_kernel.h [ 7%] Hipifying src/device/sendrecv.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/device/sendrecv.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h [ 7%] Hipifying src/enqueue.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/enqueue.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h [ 7%] Hipifying src/graph/connect.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/graph/connect.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc [ 7%] Hipifying src/graph/paths.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/graph/paths.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc [ 8%] Hipifying src/graph/rings.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rings.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/graph/rings.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rings.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rings.cc [ 8%] Hipifying src/graph/rings.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rings.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/graph/rings.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rings.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rings.h [ 8%] Hipifying src/graph/rome_models.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/graph/rome_models.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc [ 8%] Hipifying src/graph/rome_models.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/graph/rome_models.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.h [ 9%] Hipifying src/graph/search.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/graph/search.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc [ 9%] Hipifying src/graph/topo.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/graph/topo.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc [ 9%] Hipifying src/graph/topo.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/graph/topo.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h [ 9%] Hipifying src/graph/trees.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/trees.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/graph/trees.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/trees.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/trees.cc [ 10%] Hipifying src/graph/tuning.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/graph/tuning.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc [ 10%] Hipifying src/graph/xml.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/graph/xml.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.cc [ 10%] Hipifying src/graph/xml.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/graph/xml.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h [ 10%] Hipifying src/group.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/group.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/group.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/group.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/group.cc [ 10%] Hipifying src/include/BfdBacktrace.hpp -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/BfdBacktrace.hpp mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/BfdBacktrace.hpp -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/BfdBacktrace.hpp && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/BfdBacktrace.hpp [ 10%] Hipifying src/include/alloc.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/alloc.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h [ 11%] Hipifying src/include/alt_rsmi.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alt_rsmi.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/alt_rsmi.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alt_rsmi.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alt_rsmi.h [ 11%] Hipifying src/include/api_trace.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/api_trace.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/api_trace.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/api_trace.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/api_trace.h [ 11%] Hipifying src/include/archinfo.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/archinfo.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/archinfo.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/archinfo.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/archinfo.h [ 11%] Hipifying src/include/argcheck.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/argcheck.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h [ 12%] Hipifying src/include/bitops.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/bitops.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/bitops.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/bitops.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/bitops.h [ 12%] Hipifying src/include/bootstrap.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/bootstrap.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/bootstrap.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/bootstrap.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/bootstrap.h [ 12%] Hipifying src/include/channel.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/channel.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h [ 12%] Hipifying src/include/checks.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/checks.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/checks.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/checks.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/checks.h [ 12%] Hipifying src/include/coll_net.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/coll_net.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h [ 13%] Hipifying src/include/collectives.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/collectives.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h [ 13%] Hipifying src/include/comm.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/comm.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h [ 13%] Hipifying src/include/core.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/core.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h [ 14%] Hipifying src/include/cpuset.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/cpuset.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/cpuset.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/cpuset.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/cpuset.h [ 14%] Hipifying src/include/debug.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/debug.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/debug.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/debug.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/debug.h [ 14%] Hipifying src/include/device.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/device.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h [ 14%] Hipifying src/include/enqueue.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/enqueue.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/enqueue.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/enqueue.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/enqueue.h [ 15%] Hipifying src/include/gdrwrap.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/gdrwrap.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h [ 15%] Hipifying src/include/git_version.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/git_version.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/git_version.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/git_version.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/git_version.h [ 15%] Hipifying src/include/group.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/group.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/group.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/group.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/group.h [ 15%] Hipifying src/include/graph.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/graph.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/graph.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/graph.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/graph.h [ 16%] Hipifying src/include/hip_rocm_version_info.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/hip_rocm_version_info.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/hip_rocm_version_info.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/hip_rocm_version_info.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/hip_rocm_version_info.h [ 16%] Hipifying src/include/ibvcore.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/ibvcore.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/ibvcore.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/ibvcore.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/ibvcore.h [ 16%] Hipifying src/include/ibvsymbols.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/ibvsymbols.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/ibvsymbols.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/ibvsymbols.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/ibvsymbols.h [ 16%] Hipifying src/include/ibvwrap.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/ibvwrap.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/ibvwrap.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/ibvwrap.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/ibvwrap.h [ 17%] Hipifying src/include/info.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/info.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h [ 17%] Hipifying src/include/ipcsocket.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/ipcsocket.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/ipcsocket.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/ipcsocket.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/ipcsocket.h [ 17%] Hipifying src/include/msccl/msccl_kernel.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_kernel.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/msccl/msccl_kernel.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_kernel.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_kernel.h [ 17%] Hipifying src/include/msccl/msccl_lifecycle.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_lifecycle.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/msccl/msccl_lifecycle.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_lifecycle.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_lifecycle.h [ 17%] Hipifying src/include/msccl/msccl_parser.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/msccl/msccl_parser.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h [ 17%] Hipifying src/include/msccl/msccl_scheduler.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_scheduler.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/msccl/msccl_scheduler.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_scheduler.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_scheduler.h [ 18%] Hipifying src/include/msccl/msccl_setup.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_setup.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/msccl/msccl_setup.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_setup.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_setup.h [ 18%] Hipifying src/include/msccl/msccl_status.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_status.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/msccl/msccl_status.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_status.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_status.h [ 18%] Hipifying src/include/msccl/msccl_struct.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/msccl/msccl_struct.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h [ 18%] Hipifying src/include/nccl_common.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nccl_common.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nccl_common.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nccl_common.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nccl_common.h [ 18%] Hipifying src/include/nccl_net.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nccl_net.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nccl_net.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nccl_net.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nccl_net.h [ 19%] Hipifying src/include/nccl_tuner.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nccl_tuner.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nccl_tuner.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nccl_tuner.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nccl_tuner.h [ 19%] Hipifying src/include/net.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/net.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/net.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/net.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/net.h [ 19%] Hipifying src/include/net_device.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/net_device.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/net_device.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/net_device.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/net_device.h [ 19%] Hipifying src/include/npkit/npkit.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/npkit/npkit.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/npkit && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/npkit/npkit.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/npkit/npkit.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/npkit/npkit.h [ 20%] Hipifying src/include/npkit/npkit_event.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/npkit/npkit_event.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/npkit && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/npkit/npkit_event.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/npkit/npkit_event.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/npkit/npkit_event.h [ 20%] Hipifying src/include/npkit/npkit_struct.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/npkit/npkit_struct.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/npkit && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/npkit/npkit_struct.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/npkit/npkit_struct.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/npkit/npkit_struct.h [ 20%] Hipifying src/include/nvmlwrap.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvmlwrap.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nvmlwrap.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvmlwrap.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvmlwrap.h [ 21%] Hipifying src/include/nvtx.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nvtx.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx.h [ 21%] Hipifying src/include/nvtx3/nvToolsExt.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExt.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nvtx3/nvToolsExt.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExt.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExt.h [ 21%] Hipifying src/include/nvtx3/nvToolsExtCounters.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtCounters.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nvtx3/nvToolsExtCounters.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtCounters.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtCounters.h [ 22%] Hipifying src/include/nvtx3/nvToolsExtCuda.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtCuda.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nvtx3/nvToolsExtCuda.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtCuda.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtCuda.h [ 22%] Hipifying src/include/nvtx3/nvToolsExtCudaRt.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtCudaRt.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nvtx3/nvToolsExtCudaRt.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtCudaRt.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtCudaRt.h [ 22%] Hipifying src/include/nvtx3/nvToolsExtMem.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtMem.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nvtx3/nvToolsExtMem.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtMem.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtMem.h [ 22%] Hipifying src/include/nvtx3/nvToolsExtMemCudaRt.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtMemCudaRt.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nvtx3/nvToolsExtMemCudaRt.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtMemCudaRt.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtMemCudaRt.h [ 23%] Hipifying src/include/nvtx3/nvToolsExtOpenCL.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtOpenCL.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nvtx3/nvToolsExtOpenCL.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtOpenCL.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtOpenCL.h [ 23%] Hipifying src/include/nvtx3/nvToolsExtPayload.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtPayload.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nvtx3/nvToolsExtPayload.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtPayload.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtPayload.h [ 23%] Hipifying src/include/nvtx3/nvToolsExtPayloadHelper.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtPayloadHelper.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nvtx3/nvToolsExtPayloadHelper.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtPayloadHelper.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtPayloadHelper.h [ 23%] Hipifying src/include/nvtx3/nvToolsExtSemanticsCounters.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtSemanticsCounters.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nvtx3/nvToolsExtSemanticsCounters.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtSemanticsCounters.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtSemanticsCounters.h [ 24%] Hipifying src/include/nvtx3/nvToolsExtSemanticsScope.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtSemanticsScope.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nvtx3/nvToolsExtSemanticsScope.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtSemanticsScope.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtSemanticsScope.h [ 24%] Hipifying src/include/nvtx3/nvToolsExtSync.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtSync.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nvtx3/nvToolsExtSync.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtSync.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtSync.h [ 24%] Hipifying src/include/nvtx3/nvtx3.hpp -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nvtx3/nvtx3.hpp -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp [ 24%] Hipifying src/include/nvtx3/nvtxDetail/nvtxExtHelperMacros.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxExtHelperMacros.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nvtx3/nvtxDetail/nvtxExtHelperMacros.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxExtHelperMacros.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxExtHelperMacros.h [ 25%] Hipifying src/include/nvtx3/nvtxDetail/nvtxExtImpl.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxExtImpl.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nvtx3/nvtxDetail/nvtxExtImpl.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxExtImpl.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxExtImpl.h [ 25%] Hipifying src/include/nvtx3/nvtxDetail/nvtxExtImplCounters_v1.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxExtImplCounters_v1.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nvtx3/nvtxDetail/nvtxExtImplCounters_v1.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxExtImplCounters_v1.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxExtImplCounters_v1.h [ 25%] Hipifying src/include/nvtx3/nvtxDetail/nvtxExtImplMemCudaRt_v1.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxExtImplMemCudaRt_v1.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nvtx3/nvtxDetail/nvtxExtImplMemCudaRt_v1.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxExtImplMemCudaRt_v1.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxExtImplMemCudaRt_v1.h [ 25%] Hipifying src/include/nvtx3/nvtxDetail/nvtxExtImplMem_v1.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxExtImplMem_v1.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nvtx3/nvtxDetail/nvtxExtImplMem_v1.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxExtImplMem_v1.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxExtImplMem_v1.h [ 26%] Hipifying src/include/nvtx3/nvtxDetail/nvtxExtImplPayload_v1.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxExtImplPayload_v1.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nvtx3/nvtxDetail/nvtxExtImplPayload_v1.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxExtImplPayload_v1.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxExtImplPayload_v1.h [ 26%] Hipifying src/include/nvtx3/nvtxDetail/nvtxExtInit.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxExtInit.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nvtx3/nvtxDetail/nvtxExtInit.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxExtInit.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxExtInit.h [ 26%] Hipifying src/include/nvtx3/nvtxDetail/nvtxExtPayloadHelperInternal.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxExtPayloadHelperInternal.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nvtx3/nvtxDetail/nvtxExtPayloadHelperInternal.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxExtPayloadHelperInternal.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxExtPayloadHelperInternal.h [ 26%] Hipifying src/include/nvtx3/nvtxDetail/nvtxExtPayloadTypeInfo.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxExtPayloadTypeInfo.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nvtx3/nvtxDetail/nvtxExtPayloadTypeInfo.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxExtPayloadTypeInfo.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxExtPayloadTypeInfo.h [ 27%] Hipifying src/include/nvtx3/nvtxDetail/nvtxExtTypes.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxExtTypes.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nvtx3/nvtxDetail/nvtxExtTypes.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxExtTypes.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxExtTypes.h [ 27%] Hipifying src/include/nvtx3/nvtxDetail/nvtxImpl.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImpl.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nvtx3/nvtxDetail/nvtxImpl.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImpl.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImpl.h [ 27%] Hipifying src/include/nvtx3/nvtxDetail/nvtxImplCore.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplCore.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nvtx3/nvtxDetail/nvtxImplCore.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplCore.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplCore.h [ 28%] Hipifying src/include/nvtx3/nvtxDetail/nvtxImplCudaRt_v3.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplCudaRt_v3.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nvtx3/nvtxDetail/nvtxImplCudaRt_v3.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplCudaRt_v3.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplCudaRt_v3.h [ 28%] Hipifying src/include/nvtx3/nvtxDetail/nvtxImplCuda_v3.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplCuda_v3.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nvtx3/nvtxDetail/nvtxImplCuda_v3.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplCuda_v3.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplCuda_v3.h [ 28%] Hipifying src/include/nvtx3/nvtxDetail/nvtxImplOpenCL_v3.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplOpenCL_v3.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nvtx3/nvtxDetail/nvtxImplOpenCL_v3.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplOpenCL_v3.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplOpenCL_v3.h [ 28%] Hipifying src/include/nvtx3/nvtxDetail/nvtxImplSync_v3.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplSync_v3.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nvtx3/nvtxDetail/nvtxImplSync_v3.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplSync_v3.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplSync_v3.h [ 28%] Hipifying src/include/nvtx3/nvtxDetail/nvtxInit.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxInit.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nvtx3/nvtxDetail/nvtxInit.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxInit.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxInit.h [ 29%] Hipifying src/include/nvtx3/nvtxDetail/nvtxInitDecls.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxInitDecls.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nvtx3/nvtxDetail/nvtxInitDecls.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxInitDecls.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxInitDecls.h [ 29%] Hipifying src/include/nvtx3/nvtxDetail/nvtxInitDefs.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxInitDefs.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nvtx3/nvtxDetail/nvtxInitDefs.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxInitDefs.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxInitDefs.h [ 29%] Hipifying src/include/nvtx3/nvtxDetail/nvtxLinkOnce.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxLinkOnce.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nvtx3/nvtxDetail/nvtxLinkOnce.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxLinkOnce.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxLinkOnce.h [ 29%] Hipifying src/include/nvtx3/nvtxDetail/nvtxTypes.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxTypes.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nvtx3/nvtxDetail/nvtxTypes.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxTypes.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxTypes.h [ 29%] Hipifying src/include/nvtx_stub.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx_stub.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/nvtx_stub.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx_stub.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx_stub.h [ 29%] Hipifying src/include/p2p.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/p2p.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h [ 29%] Hipifying src/include/param.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/param.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/param.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/param.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/param.h [ 30%] Hipifying src/include/profiler.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/profiler.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/profiler.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/profiler.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/profiler.h [ 30%] Hipifying src/include/proxy.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/proxy.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/proxy.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/proxy.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/proxy.h [ 30%] Hipifying src/include/rccl_common.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/rccl_common.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h [ 30%] Hipifying src/include/rccl_float8.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/rccl_float8.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h [ 30%] Hipifying src/include/rccl_vars.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_vars.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/rccl_vars.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_vars.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_vars.h [ 31%] Hipifying src/include/register.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/register.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/register.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/register.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/register.h [ 31%] Hipifying src/include/rocm_smi_wrap.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rocm_smi_wrap.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/rocm_smi_wrap.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rocm_smi_wrap.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rocm_smi_wrap.h [ 31%] Hipifying src/include/rocmwrap.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rocmwrap.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/rocmwrap.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rocmwrap.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rocmwrap.h [ 32%] Hipifying src/include/roctx.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/roctx.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/roctx.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/roctx.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/roctx.h [ 32%] Hipifying src/include/shm.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/shm.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/shm.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/shm.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/shm.h [ 32%] Hipifying src/include/signals.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/signals.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/signals.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/signals.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/signals.h [ 32%] Hipifying src/include/socket.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/socket.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/socket.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/socket.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/socket.h [ 33%] Hipifying src/include/strongstream.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/strongstream.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/strongstream.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/strongstream.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/strongstream.h [ 33%] Hipifying src/include/timer.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/timer.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/timer.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/timer.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/timer.h [ 33%] Hipifying src/include/transport.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/transport.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/transport.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/transport.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/transport.h [ 33%] Hipifying src/include/trees.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/trees.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/trees.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/trees.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/trees.h [ 34%] Hipifying src/include/tuner.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/tuner.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/tuner.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/tuner.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/tuner.h [ 34%] Hipifying src/include/utils.h -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/include/utils.h -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h [ 34%] Hipifying src/init.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/init.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc [ 35%] Hipifying src/init_nvtx.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init_nvtx.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/init_nvtx.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init_nvtx.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init_nvtx.cc [ 36%] Hipifying src/misc/alt_rsmi.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/misc/alt_rsmi.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc [ 36%] Hipifying src/misc/api_trace.c -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/api_trace.c mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/misc/api_trace.c -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/api_trace.c && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/api_trace.c [ 37%] Hipifying src/misc/api_trace.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/api_trace.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/misc/api_trace.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/api_trace.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/api_trace.cc [ 37%] Hipifying src/misc/archinfo.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/archinfo.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/misc/archinfo.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/archinfo.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/archinfo.cc [ 37%] Hipifying src/misc/argcheck.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/argcheck.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/misc/argcheck.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/argcheck.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/argcheck.cc [ 37%] Hipifying src/misc/ibvsymbols.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ibvsymbols.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/misc/ibvsymbols.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ibvsymbols.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ibvsymbols.cc [ 37%] Hipifying src/misc/ibvwrap.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ibvwrap.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/misc/ibvwrap.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ibvwrap.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ibvwrap.cc [ 37%] Hipifying src/misc/ipcsocket.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ipcsocket.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/misc/ipcsocket.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ipcsocket.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ipcsocket.cc [ 38%] Hipifying src/misc/msccl/msccl_lifecycle.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/misc/msccl/msccl_lifecycle.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc [ 38%] Hipifying src/misc/msccl/msccl_parser.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/misc/msccl/msccl_parser.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc [ 38%] Hipifying src/misc/msccl/msccl_setup.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/misc/msccl/msccl_setup.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc [ 38%] Hipifying src/misc/msccl/msccl_status.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_status.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/misc/msccl/msccl_status.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_status.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_status.cc [ 38%] Hipifying src/misc/npkit.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/npkit.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/misc/npkit.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/npkit.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/npkit.cc [ 39%] Hipifying src/misc/nvmlwrap_stub.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/nvmlwrap_stub.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/misc/nvmlwrap_stub.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/nvmlwrap_stub.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/nvmlwrap_stub.cc [ 39%] Hipifying src/misc/param.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/param.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/misc/param.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/param.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/param.cc [ 39%] Hipifying src/misc/profiler.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/profiler.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/misc/profiler.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/profiler.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/profiler.cc [ 39%] Hipifying src/misc/rocm_smi_wrap.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/rocm_smi_wrap.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/misc/rocm_smi_wrap.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/rocm_smi_wrap.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/rocm_smi_wrap.cc [ 40%] Hipifying src/misc/rocmwrap.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/rocmwrap.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/misc/rocmwrap.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/rocmwrap.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/rocmwrap.cc [ 40%] Hipifying src/misc/roctx.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/roctx.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/misc/roctx.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/roctx.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/roctx.cc [ 40%] Hipifying src/misc/shmutils.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/shmutils.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/misc/shmutils.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/shmutils.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/shmutils.cc [ 40%] Hipifying src/misc/signals.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/signals.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/misc/signals.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/signals.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/signals.cc [ 41%] Hipifying src/misc/socket.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/socket.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/misc/socket.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/socket.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/socket.cc [ 41%] Hipifying src/misc/strongstream.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/strongstream.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/misc/strongstream.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/strongstream.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/strongstream.cc [ 41%] Hipifying src/misc/tuner.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/tuner.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/misc/tuner.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/tuner.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/tuner.cc [ 41%] Hipifying src/misc/utils.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/utils.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/misc/utils.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/utils.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/utils.cc [ 41%] Hipifying src/msccl.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/msccl.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc [ 41%] Hipifying src/net.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/net.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/net.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/net.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/net.cc [ 41%] Hipifying src/proxy.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/proxy.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/proxy.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/proxy.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/proxy.cc [ 42%] Hipifying src/rccl_wrap.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/rccl_wrap.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/rccl_wrap.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/rccl_wrap.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/rccl_wrap.cc [ 42%] Hipifying src/register.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/register.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/register.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/register.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/register.cc [ 42%] Hipifying src/transport.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/transport.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport.cc [ 43%] Hipifying src/transport/coll_net.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/transport/coll_net.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc [ 43%] Hipifying src/transport/generic.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/generic.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/transport/generic.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/generic.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/generic.cc [ 43%] Hipifying src/transport/net_ib.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_ib.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/transport/net_ib.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_ib.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_ib.cc [ 44%] Hipifying src/transport/net_socket.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_socket.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/transport/net_socket.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_socket.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_socket.cc [ 44%] Hipifying src/transport/net.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/transport/net.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc [ 44%] Hipifying src/transport/nvls.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/nvls.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/transport/nvls.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/nvls.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/nvls.cc [ 44%] Hipifying src/transport/p2p.cc -> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/p2p.cc mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/src/transport/p2p.cc -o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/p2p.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/p2p.cc cd /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2 /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2 /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/CMakeFiles/rccl.dir/DependInfo.cmake "--color=" gmake[2]: Leaving directory '/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build' /usr/bin/gmake -f CMakeFiles/rccl.dir/build.make CMakeFiles/rccl.dir/build gmake[2]: Entering directory '/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build' [ 44%] Building CXX object CMakeFiles/rccl.dir/hipify/src/bootstrap.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/bootstrap.cc.o -MF CMakeFiles/rccl.dir/hipify/src/bootstrap.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/bootstrap.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/bootstrap.cc [ 44%] Building CXX object CMakeFiles/rccl.dir/hipify/src/channel.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/channel.cc.o -MF CMakeFiles/rccl.dir/hipify/src/channel.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/channel.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/bootstrap.cc:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/bootstrap.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/bootstrap.cc:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/bootstrap.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/bootstrap.cc:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/bootstrap.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/bootstrap.cc:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/bootstrap.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/bootstrap.cc:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/bootstrap.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/bootstrap.cc:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/bootstrap.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/bootstrap.cc:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/bootstrap.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/bootstrap.cc:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/bootstrap.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/bootstrap.cc:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/bootstrap.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/bootstrap.cc:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/bootstrap.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/bootstrap.cc:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/bootstrap.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:In file included from 77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/bootstrap.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/bootstrap.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/bootstrap.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/bootstrap.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/bootstrap.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/bootstrap.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/bootstrap.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/bootstrap.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/bootstrap.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/bootstrap.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/bootstrap.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx1201. 2 warnings generated when compiling for gfx1102. 2 warnings generated when compiling for gfx906. 2 warnings generated when compiling for gfx942. 2 warnings generated when compiling for gfx1030. 2 warnings generated when compiling for gfx1200. 2 warnings generated when compiling for gfx908. 2 warnings generated when compiling for gfx1101. 2 warnings generated when compiling for gfx90a. 2 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:224:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 224 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ 2 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:224:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 224 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:224:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 224 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:224:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 224 | static ncclResult_t ncclGdrCudaFree(voIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:224:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 224 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ id* gdrHandle) { | ^~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:224:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 224 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ [ 45%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives.cc.o -MF CMakeFiles/rccl.dir/hipify/src/collectives.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h8 warnings generated when compiling for gfx906. :13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:224:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 224 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:224:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 224 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:224:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 224 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:224:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 224 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:224:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 224 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ 8 warnings generated when compiling for gfx1100. 8 warnings generated when compiling for gfx1200. 8 warnings generated when compiling for gfx1201. 8 warnings generated when compiling for gfx908. 8 warnings generated when compiling for gfx942. 8 warnings generated when compiling for gfx90a. 8 warnings generated when compiling for gfx1101. 8 warnings generated when compiling for gfx1102. 8 warnings generated when compiling for gfx1030. 8 warnings generated when compiling for host. [ 45%] Building CXX object CMakeFiles/rccl.dir/hipify/src/debug.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/debug.cc.o -MF CMakeFiles/rccl.dir/hipify/src/debug.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/debug.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/debug.cc In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:93:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 93 | constexpr nvtxPayloadSchemaEntry_t AllGatherSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:98:23: warning: unused variable 'payload' [-Wunused-variable] 98 | NvtxParamsAllGather payload{sendcount * ncclTypeSize(datatype), datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:126:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 126 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:132:23: warning: unused variable 'payload' [-Wunused-variable] 132 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:161:38: warning: unused variable 'AllToAllSchema' [-Wunused-variable] 161 | constexpr nvtxPayloadSchemaEntry_t AllToAllSchema[] = { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:166:22: warning: unused variable 'payload' [-Wunused-variable] 166 | NvtxParamsAllToAll payload{count * ncclTypeSize(datatype), datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:212:38: warning: unused variable 'AllToAllvSchema' [-Wunused-variable] 212 | constexpr nvtxPayloadSchemaEntry_t AllToAllvSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:219:23: warning: unused variable 'payload' [-Wunused-variable] 219 | NvtxParamsAllToAllv payload{sendcounts[comm->rank] * ncclTypeSize(datatype), recvcounts[comm->rank] * ncclTypeSize(datatype), datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:261:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 261 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:267:23: warning: unused variable 'payload' [-Wunused-variable] 267 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:301:40: warning: unused variable 'GatherSchema' [-Wunused-variable] 301 | constexpr nvtxPayloadSchemaEntry_t GatherSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:307:22: warning: unused variable 'payload' [-Wunused-variable] 307 | NvtxParamsGather payload{sendcount * ncclTypeSize(datatype), root, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:343:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 343 | constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:351:20: warning: unused variable 'payload' [-Wunused-variable] 351 | NvtxParamsReduce payload{count * ncclTypeSize(datatype), root, op, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:378:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 378 | constexpr nvtxPayloadSchemaEntry_t ReduceScatterSchema[] = { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:385:27: warning: unused variable 'payload' [-Wunused-variable] 385 | NvtxParamsReduceScatter payload{recvcount * ncclTypeSize(datatype), op, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:412:40: warning: unused variable 'ScatterSchema' [-Wunused-variable] 412 | constexpr nvtxPayloadSchemaEntry_t ScatterSchema[] = { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:418:23: warning: unused variable 'payload' [-Wunused-variable] 418 | NvtxParamsScatter payload{recvcount * ncclTypeSize(datatype), root, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:461:22: warning: unused variable 'payload' [-Wunused-variable] 461 | NvtxParamsSendRecv payload{count * ncclTyp/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:93:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 93 | constexpr nvtxPayloadSchemaEntry_t AllGatheSize(datatype), peer, datatype}; /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:93:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 93 | constexpr nvtxPayloadSchemaEntry_t AllGatherSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:98:23: warning: unused variable 'payload' [-Wunused-variable] 98 | NvtxParamsAllGather payload{sendcount * ncclTypeSize(datatype), datatype}; | ^~~~~~~ | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.ccerSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:98:23: warning: unused variable 'payload' [-Wunused-variable] 98 | NvtxParamsAllGather payload{sendcount * ncclTypeSize(datatype), datatype}; | ^~~~~~~ :486:22: warning: unused variable 'payload' [-Wunused-variable] 486 | NvtxParamsSendRecv payload{count * ncclTyp/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cceSize(datatype),:126:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 126 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:132:23: warning: unused variable 'payload' [-Wunused-variable] 132 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op, datatype}; | ^~~~~~~ peer, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:161:38: warning: unused variable 'AllToAllSchema' [-Wunused-variable] 161 | constexpr nvtxPayloadSchemaEntry_t AllToAllSchema[] = { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:166:22: warning: unused variable 'payload' [-Wunused-variable] 166 | NvtxParamsAllToAll payload{count * ncclTypeSize(datatype), datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:126:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 126 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:132:23: warning: unused variable 'payload' [-Wunused-variable] 132 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:93:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 93 | constexpr nvtxPayloadSchemaEntry_t AllGatherSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:98:23: warning: unused variable 'payload' [-Wunused-variable] 98 | NvtxParamsAllGather payload{sendcount * ncclTypeSize(datatype), datatype}; | ^~~~~~~ datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:93:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 93 | constexpr nvtxPayloadSchemaEntry_t AllGatherSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:98:23: warning: unused variable 'payload' [-Wunused-variable] 98 | NvtxParamsAllGather payload{sendcount * ncclTypeSize(datatype), datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:212:38: warning: unused variable 'AllToAllvSchema' [-Wunused-variable] 212 | constexpr nvtxPayloadSchemaEntry_t AllToAllvSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:219:23: warning: unused variable 'payload' [-Wunused-variable] 219 | NvtxParamsAllToAllv payload{sendcounts[comm->rank] * ncclTypeSize(datatype), recvcounts[comm->rank] * ncclTypeSize(datatype), datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:126:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 126 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:132:23: warning: unused variable 'payload' [-Wunused-variable] 132 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:126:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 126 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:132:23: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:261:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 261 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:267:23: warning: unused variable 'payload' [-Wunused-variable] 267 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root, datatype}; | ^~~~~~~ warning: unused variable 'payload' [-Wunused-variable] 132 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:161:38: warning: unused variable 'AllToAllSchema' [-Wunused-variable] 161 | constexpr nvtxPayloadSchemaEntry_t AllToAllSchema[] = { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:161:38: warning: unused variable 'AllToAllSchema' [-Wunused-variable] 161 | constexpr nvtxPay166:22: warning: unused variable 'payload' [-Wunused-variable] 166 | NvtxParamsAllToAll payload{coloadSchemaEntry_t AllToAllSchema[] = { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:166:22: warning: unused variable 'payload' [-Wunused-variable] 166 | NvtxParamsAllToAll payload{count * ncclTypeSize(datatype), datatype}; | ^~~~~~~ unt * ncclTypeSize(datatype), datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:161:38: warning: unused variable 'AllToAllSchema' [-Wunused-variable] 161 | constexpr nvtxPayloadSchemaEntry_t AllToAllSchema[] = { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:166:22: warning: unused variable 'payload' [-Wunused-variable] 166 | NvtxParamsAllT/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:301:40: warning: unused variable 'GatherSchema' [-Wunused-variable] 301 | constexpr nvtxPayloadSchemaEntry_t GatherSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:307:22: warning: unused variable 'payload' [-Wunused-variable] 307 | NvtxParamsGather payload{sendcount * ncclTypeSize(datatype), root, datatype}; | ^~~~~~~ oAll payload{count * ncclTypeSize(datatype), datatyp/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:93:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 93 | constexpr nvtxPayloadSchemaEntry_t AllGatherSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:98:23: warning: unused variable 'payload' [-Wunused-variable] 98 | NvtxParamsAllGather payload{sendcount * ncclTypeSize(datatype), datatype}; | ^~~~~~~ e}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:343:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 343 | constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:351:20: warning: unused variable 'payload' [-Wunused-variable] 351 | NvtxParamsReduce payload{count * ncclTypeSize(datatype), root, op, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:212:38: warning: unused variable 'AllToAllvSchema' [-Wunused-variable] 212 | constexpr nvtxPayloadSchemaEntry_t AllToAllvSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:219:23: warning: unused variable 'payload' [-Wunused-variable] 219 | NvtxParamsAllToAllv payload{sendcounts[comm->rank] * ncclTypeSize(datatype), recvcounts[comm->rank] * ncclTypeSize(datatype), datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:261:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 261 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:267:23: warning: unused variable 'payload' [-Wunused-variable] 267 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:212:38: warning: unused variable 'AllToAllvSchema' [-Wunused-variable] 212 | constexpr nvtxPayl/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:93:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 93 | constexpr nvtxPayloadSchemaEntry_t AllGatherSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:98:23: warning: unused variable 'payload' [-Wunused-variable] 98 | NvtxParamsAllGather payload{sendcount * ncclTypeSize(datatype), datatype}; | ^~~~~~~ oadSchemaEntry_t AllToAllvSchema[] = { | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:126:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 126 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:132:23: warning: unused variable 'payload' [-Wunused-variable] 132 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op, datatype}; | ^~~~~~~ ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:219:23: warning: unused variable 'payload' [-Wunused-variable] 219 | NvtxParamsAllToAllv paylo/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:378ad{sendcounts:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 378 | constexpr nvtxPayloadSchemaEntry_t ReduceScatterSchema[] = { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:385:27: warning: unused variable 'payload' [-Wunused-variable] 385 | NvtxParamsReduceScatter payload{recvcount * ncclTypeSize(datatype), op, datatype}; | ^~~~~~~ [comm->rank] * ncclTypeSize(datatype), recvcounts[comm->rank] * nc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.ccc:212:38l: warning: unused variable 'AllToAllvSchema' [-Wunused-variable] T212 | consytexpr nvptxPayloeadSchemaESntry_t AlilToAllvSzchema[] =e /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:126:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 126 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:132:23: warning: unused variable 'payload' [-Wunused-variable] 132 | NvtxParamsAllReduce payload{ | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc(:219:23: warning: unused variable 'payload' [-Wunused-variable] d219 | NvtaxParamsAtll{count * ncclTypeSize(datatype), op, datatype}; | ^~~~~~~ ToAlalv paytype), datatype}; | ^~~~~~~ load{sendcounts[comm->rank] * ncclTypeSize(datatype), recv/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:93:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 93 | constexpr nvtxPayloadSchemaEntry_t AllGatherSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:98:23: warning: unused variable 'payload' [-Wunused-variable] 98 | NvtxParamsAllGather payload{sendcount * ncclTypeSize(datatype), datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cccounts[comm->rank] * ncclTypeSize(datatype), datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:261:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 261 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:267:23: warning: unused variable 'payload' [-Wunused-variable] 267 | NvtxParamsBroadcast payload{count */builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc :161:38: warning: unused variable 'AllToAllSchema' [-Wunused-variable] 161 | constexpr nvtxPayloadSchemaEntry_t AllToAllSchema[] = { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:166:22: warning: unused variable 'payload' [-Wunused-variable] 166 | NvtxParamsAllToAll payload{count * ncclTypeSize(datatype), datatype}; | ^~~~~~~ ncclTypeSize(da:261:t38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] a 261 | ctons/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:412:40: warning: unused variable 'ScatterSchema' [-Wunused-variable] 412 | constexpr nvtxPayloadSchemaEntry_t ScatterSchema[] = { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:418:23: warning: unused variable 'payload' [-Wunused-variable] 418 | NvtxParamsScatter payload{recvcount * ncclTypeSize(datatype), root, datatype}; texypr nvtxpPayloaedSchem)aEntry,_t Bro adcastrSchemao[] = | ^~~~~~~ {o | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cct:267:23: ,warning: unused variable 'payload' [-Wunused-variable] 267 | NvtxdP/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.ccara:126:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 126 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:132:23: warning: unused variable 'payload' [-Wunused-variable] 132 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op, datatype}; | ^~~~~~~ msBroadcasta patyloaatype}; | ^~~~~~~ d{count * ncclTypeSize(datatype), root, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:301:40: warning: unused variable 'GatherSchema' [-Wunused-variable] 301 | constexpr nvtxPayloadSchemaEntry_t GatherSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:307:22: warning: unused variable 'payload' [-Wunused-variable] 307 | NvtxParamsGather payload{sendcount * ncclTypeSize(datatype), root, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:343:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 343 | constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:351:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:161:38: warning: unused variable 'AllToAllSchema' [-Wunused-variable] 161 | constexpr nvtxPayloadSchemaEntry_t AllToAllSchema[] = { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:166:22: warning: unused variable 'payload' [-Wunused-variable] 166 | NvtxParamsAllToAll payload{count * ncclTypeSize(datatype), datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:212:38: warning: unused variable 'AllToAllvSchema' [-Wunused-variable] 212 | constexpr nvtxPayloadSchemaEntry_t AllToAllvSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:219:23: warning: unused variable 'payload' [-Wunused-variable] 219 | NvtxParamsAllToAllv payload{sendcounts[comm->rank] * ncclTypeSize(datatype), recvcounts[comm->rank] * ncclTypeSize(datatype), datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:301:40: warning: unused variable 'GatherSchema' [-Wunused-variable] 301 | constexpr n20: warning: unused variable 'payload' [-Wunused-variable] v 351 | NvtxParamsReduce payload{count * ncclTypeSize(datatype), root, op, datatype}; | ^~~~~~~ txPayloadSchemaEntry_t GatherSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:378:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 378 | constexpr nvtxPayloadSchemaEntry_t ReduceScatterSchema[] = { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:385:27: warning: unused variable 'payload' [-Wunused-variable] 385 | NvtxParamsReduceScatter payload{recvcount * ncclTypeSize(datatype), op, datatype}; | ^~~~~~~ 307:22: warning: unused variable 'payload' [-Wunused-variable] 307 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.ccNvtxParamsGather payload{sendcount * ncclTypeSize(datatype), root, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:301:40/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:461:22: warning: unused variable 'payload' [-Wunused-variable] 461 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer, datatype}; | ^~~~~~~ : warning: unused variable 'GatherSchema' [-Wunused-variable] 301 | constexpr nvtxPayloadSchemaEntry_t GatherSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:307:22: warning: unused variable 'payload' [-Wunused-variable] 307 | NvtxParamsGat:93:38h: warning: unused variable 'AllGatherSchema' [-Wunused-variable] e 93 | crons texpr pnvtxPayaloadScyhemaEnltry_t AollGathaerSchemda[] = {{ | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.ccs:98:23:e warning: unused variable 'payload' [-Wunused-variable] n98 | NvdtxParacmsAllGoather puayloadn{/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.ccs:161:38: warning: unused variable 'AllToAllSchema' [-Wunused-variable] 161 | constexpr nvtxPayloadSchemaEntry_t AllToAllSchema[] = { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:166:22: warning: unused variable 'payload' [-Wunused-variable] 166 | NvtxParamsAllToAll payload{count * ncclTypeSize(datatype), datatype}; | ^~~~~~~ ent * ncclTypeSize(datdcount * ncclTypeSize(dataty/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:212:38: warning: unused variable 'AllToAllvSchema' [-Wunused-variable] 212 | constexpr nvtxPayloadSchemaEntry_t AllToAllvSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:219:23: warning: unused variable 'payload' [-Wunused-variable] 219 | NvtxParamsAllToAllv payload{sendcounts[comm->rank] * ncclTypeSize(datatype), recvcounts[comm->rank] * ncclpe), datatype}; | ^~~~~~~ atype), roTypeSize(datatype), datatype}; | ^~~~~~~ ot, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:343:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 343 | :261:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 261 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:267:23: warning: unused variable 'payload' [-Wunused-variable] 267 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root, datatype}; | ^~~~~~~ constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:351:20: warning: unused variable 'payload' [-Wunused-variable] 351 | NvtxParamsReduce payload{count * ncclTypeSize(datatype), root, op, datatype}; /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc| ^~~~~~~ :126:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 126 | static constexp/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:486:22: warning: unused variable 'payload' [-Wunused-variable] 486 | NvtxParamsSendRecv paylor anvd{count * ncclTypeSize(datatype), peer, datatype}; | ^~~~~~~ txPayloadSchemaEntry_t AllReduceSchema[]/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:261:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 261 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:267:23: warning: unused variable 'payload' [-Wunused-variable] 267 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root, datatype}; | ^~~~~~~ = /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:343:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] :378:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 378343 | co | nstexpr nvt{ x | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cccP:132:23:oa warning: unused variable 'payload' [-Wunused-variable] ny132 | slNvtxPtoaramseaAllRedxduce Spaylopcad{corhunt * e nc cnmlTypvaeSize(tEdatatxnype),Pt op,ar/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:412:40: warning: unused variable 'ScatterSchema' [-Wunused-variable] 412 | constexpr nvtxPayloadSchemaEntry_t ScatterSchema[] = { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:418:23: warning: unused variable 'payload' [-Wunused-variable] 418 | NvtxParamsScatter payload{recvcount * ncclTypeSize(datatype), root, datatype}; | ^~~~~~~ datatyype}y;_ | ^~~~~~~l t/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:212:38: warning: unused variable 'AllToAllvSchema' [-Wunused-variable] 212 | constexpr nvtxPayloadSchemaEntry_t AllToAllvSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:219:23: warning: unused variable 'payload' [-Wunused-variable] 219 | NvtxParamsAllToAllv payload{sendcounts[comm->rank] * ncclTypeSize(datatype), recvcounts[comm->rank] * ncclTypeSize(datatype), datatype}; | ^~~~~~~ oadSchemaEntry_t Redu ReducceScatteerScheSma[] =chema[] = { { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:385:27: warning: unused variable 'payload' [-Wunused-variable] | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:351:20: warning: unused variable 'payload' [-Wunused-variable] 351 | NvtxParamsReduce payload{count * ncclTypeSize(datatype), root, op, datatype}; | 385 ^~~~~~~ | Nvt xParamsReduceScatter payload{recvcount * ncclTypeSize(datatype), op, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:261:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 261 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:267:23: warning: unused variable 'payload' [-Wunused-variable] 267 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:412:40: warning: :161:38: warning: unused variable 'AllToAllSchema' [-Wunused-variable] 161 | constexpr nvtxPayloadSchemaEntry_t A/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:301:40: warning: unused variable 'GatherSchema' [-Wunused-variable] 301 | constexpr nvtxPayloadSchemaEntry_t GatherSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:307:22: warning: unused variable 'payload' [-Wunused-variable] 307 | NvtxParamsGather payload{sendcount * ncclTypeSize(datatype), root, datatype}; | ^~~~~~~ llToAllSchema[] = { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:166:22: warning: unused variable 'payload' [-Wunused-variable] 166 | NvtxParamsAllToAll payload{count * ncc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.ccl:461:22: warning: unused variable 'payload' [-Wunused-variable] 461 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer, datatype}; | ^~~~~~~ TypeSize(datatype), datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:301:40: warning: unused variable 'GatherSchema' [-Wunused-variable] 301 | constexpr nvtxPayloadSchemaEntry_t GatherSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:307:22: warning: unused variable 'payload' [-Wunused-variable] 307 | NvtxParamsGather payload{sendcount * ncclTypeSize(datatype), root, datatype}; | ^~~~~~~ unused variable 'ScatterSchema' [-Wunused-variable] 412 | constexpr nvtxPayloadSchemaEntry_t ScatterSchema[] = { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:418:23: warning: unused variable 'payload' [-Wunused-variable] 418 | NvtxParamsScatter payload{recvcount * ncclTypeSize(datatype), roo/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cct, datat:343:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 343 | constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:351:20: warning: unused variable 'payload' [-Wunused-variable] 351 | NvtxParamsReduce payload{count * ncclTypeSize(datatype), root, op, datatype}; | ^~~~~~~ ype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:378:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 378 | constexpr nvtxPayloadSchemaEntry_t ReduceScatterSchema[/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:343:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 343 | constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = {/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:351:20: warning: unused variable 'payload' [-Wunused-variable] 351 | NvtxParamsReduce payload{count * ncclTypeSize(datatype), root, op, datatype}; | ^~~~~~~ :212:38: warning: unused variable 'AllToAllvSchema' [-Wunused-variable] 212 | constexpr nvtxPayloadSchemaEntry_t AllToAllvSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:219:23: warning: unused variable 'payload' [-Wunused-variable] 219 | Nv:t486:22: warning: unused variable 'payload' [-Wunused-variable] 486 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer, datatype}; | ^~~~~~~ xParamsAllToAllv p]a = { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:385:27: warning: unused variable 'payload' [-Wunused-variable] 385 | NvtxParamsReduceScatter payload{recvcount * ncclTypeSize(datatype), op, datatype}; | ^~~~~~~ yloaIn file included from d{sendcounts[co:378m:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable]m 378 | - const>expr nvrtxPaylaoadSchnemaEntkry_t R]educeS catter*Schema [] = {n | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.ccc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.ccc:385l:461:22:: warning: TypeSize(datatype), recvcounts[comm->rank] * ncclTypeSize(datatype), datatype}; | ^~~~~~~ unused variable 'payload' [-Wunused-variable] 27 461 | :/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc Nvtx: Parwarning: a7msSunused variable 'payload' [-Wunused-variable]e: ndR eIn file included from cv /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.hpayl:oad{385c10oun | t: * n/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:301:40: warning: unused variable 'GatherSchema' [-Wunused-variable] 301 | constexpr nvtxPayloadSchemaEntry_t GatherSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:307:22: warning: unused variable 'payload' [-Wunused-variable] 307 | NvtxParamsGather payload{sendcount * ncclTypeSize(datatype), root, datatype}; | ^~~~~~~ In file included from ccl T/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.hypeNS:izev38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2it(xParalmsReduoceScan/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:378:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 378 | constexpr nvtxPayloadSchemaEntry_t ReduceScatterSchema[] = { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:385:27: warning: unused variable 'payload' [-Wunused-variable] 385 | NvtxParamsReduceScatter payload{recvcount * ncclTypeSize(datatype), op, datatype}; | ^~~~~~~ tter gpaylo ad{rencvco)unt * ncclTy{(datp atype e), S| peeri ^~~~~, d atatyIn file included from pez}; | ^~~~~~~e /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:10: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static nc(datatype), op, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:261:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 261 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:267:23: warning: unused variable 'payload' [-Wunused-variable] 267 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root, datatype}; | ^~~~~~~ clResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* sy/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:486:22: warning: unused variable 'payload' [-Wunused-variable] 486 | NvtxParams/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:343:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 343 | SendR constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:351:20: warning: unused variable 'payload' [-Wunused-variable] 351 | NvtxParamsReduce payload{count * ncclTypeSize(datatype), root, op, datatype}; | ^~~~~~~ ecv payload{count * ncclTypeSize(datatype), peer, datastem, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopo/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:412:40: warning: unused variable 'ScatterSchema' [-Wunused-variable] 412 | constexpr nvtxPayloadSchemaEntry_t ScatterSchema[] = { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:418:23: warning: unused variable 'payload' [-Wunused-variable] 418 | NvtxParamsScatter payload{recvcount * ncclTypeSize(datatype), root, datatype}; | ^~~~~~~ System* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | stattype}; i | ^~~~~~~ c ncclResult_t n/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:412:40: warning: unused variable 'ScatterSchema' [-Wunused-variable] 412 | constexp/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:378:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable]r nvt 378 | constexpr nvtxPayloadSchemaEntry_t ReduceScatterSchema[] = { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:385:27: warning: unused variable 'payload' [-Wunused-variable] 385 | NvtxParamsReduceScatter payload{recvcount * nxPayloadSchemaEntry_t ScatterSchema[] = { cclcclTypeSize(datatype), op, datatype}; | ^~~~~~~ T opoI| dToNe ^~~~~~~~~~~~~tDev( struc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cct ncclTop:oSyst418em* s:yste23m, in:t64_t id, warning: int* unused variable 'payload' [-Wunused-variable]netDe v) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262418:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] | 262 | static floa t nc clTopoNXGMISvtxpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopParamsScatter payload{recvcount * ncclTypeSize(datatypeo)NVL,ink Bw(rinto cuodaCtomp,Cap ) {d | a ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.ht:283a:13:t warning: unused function 'isPow2' [-Wunused-function]y :412:40: warning: unused variable 'ScatterSchema' [-Wunused-variable] 412 | constexpr nvtxPayloadSchemaEntry_t ScatterSchema[] = { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:418:23: warning: unused variable 'payload' [-Wunused-variable] 418 | NvtxParamsScatter payload{recvcount * ncclTypeSize(datatype), root, datatype}; | ^~~~~~~ pe}; | ^~~~~~~ 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:448:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 448 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:93:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 93 | constexpr nvtxPayloadSchemaEntry_t AllGatherSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:98:23: warning: unused variable 'payload' [-Wunused-variable] 98 | NvtxParamsAllGather payload{sendcount * ncclTypeSize(datatype), datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:461:22: warning: unused variable 'payload' [-Wunused-variable] 461 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer, datatype}; | ^~~~~~~ :461:22: warning: unused variable 'payload' [-Wunused-variable] 461 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:301:40: warning: unused variable 'GatherSchema' [-Wunused-variable] 301 | constexpr nvtxPayloadSchemaEntry_t GatherSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:307:22: warning: unused variable 'payload' [-Wunused-variable] 307 | NvtxParamsGather payload{sendcount * ncclTypeSize(datatype), root, datatype}; | ^~~~~~~ :486:22: warning: unused variable 'payload' [-Wunused-variable] /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:412:40: warning: unused variable 'ScatterSchema' [-Wunused-variable] 412 | constexpr nvtxPayloadSchemaEntry_t ScatterSchema[] = { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:418:23: warning: unused variable 'payload' [-Wunused-variable] 418 | NvtxParamsScatter payload{recvcount * ncclTypeSize(datatype), root, datatype}; | ^~~~~~~ 486 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:126:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 126 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:132:23: warning: unused variable 'payload' [-Wunused-variable] 132 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:343:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 343 | constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:351:20: warning: unused variable 'payload' [-Wunused-variable] 351 | NvtxParamsReduce payload{count * ncclTypeSize(datatype), root, op, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:461:22: warning: unused variable 'payload' [-Wunused-variable] 461 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:486:22: warning: unused variable 'payload' [-Wunused-variable] 486 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:486:22: warning: unused variable 'payload' [-Wunused-variable] 486 | NvtxPara/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:461:22: warning: unused variable 'payload' [-Wunused-variable] 461 | msSendRecv payload{count * ncclTypeSize(datatype), peer Nvtx/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:378:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 378 | constexpr nvtxPayloadSchemaEntry_t ReduceScatterSchema[] = { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:385:27: warning: unused variable 'payload' [-Wunused-variable] 385 | NvtxParamsReduceScatter payload{recvcount * nccParamsSendR, datatype}; | ^~~~~~~ ecv payload{countlTypeSize(datatype), op, datatype}; | ^~~~~~~ * ncclTypeSize(datatype), peer, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:161:38: warning: unused variable 'AllToAllSchema' [-Wunused-variable] 161 | constexpr nvtxPayloadSchemaEntry_t AllToAllSchema[] = { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:166:22: warning: unused variable 'payload' [-Wunused-variable] 166 | NvtxParamsAllToAll payload{count * ncclTypeSize(datatype), datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:486:22: warning: unused variable 'payload' [-Wunused-variable] 486 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:412:40: warning: unused variable 'ScatterSchema' [-Wunused-variable] 412 | constexpr nvtxPayloadSchemaEntry_t ScatterSchema[] = { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:418:23: warning: unused variable 'payload' [-Wunused-variable] 418 | NvtxParamsScatter payload{recvcount * ncclTypeSize(datatype), root, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:212:38: warning: unused variable 'AllToAllvSchema' [-Wunused-variable] 212 | constexpr nvtxPayloadSchemaEntry_t AllToAllvSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:219:23: warning: unused variable 'payload' [-Wunused-variable] 219 | NvtxParamsAllToAllv payload{sendcounts[comm->rank] * ncclTypeSize(datatype), recvcounts[comm->rank] * ncclTypeSize(datatype), datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:261:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 261 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:267:23: warning: unused variable 'payload' [-Wunused-variable] 267 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:461:22: warning: unused variable 'payload' [-Wunused-variable] 461 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:486:22: warning: unused variable 'payload' [-Wunused-variable] 486 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:301:40: warning: unused variable 'GatherSchema' [-Wunused-variable] 301 | constexpr nvtxPayloadSchemaEntry_t GatherSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:307:22: warning: unused variable 'payload' [-Wunused-variable] 307 | NvtxParamsGather payload{sendcount * ncclTypeSize(datatype), root, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:343:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 343 | constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:351:20: warning: unused variable 'payload' [-Wunused-variable] 351 | NvtxParamsReduce payload{count * ncclTypeSize(datatype), root, op, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:378:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 378 | constexpr nvtxPayloadSchemaEntry_t ReduceScatterSchema[] = { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:385:27: warning: unused variable 'payload' [-Wunused-variable] 385 | NvtxParamsReduceScatter payload{recvcount * ncclTypeSize(datatype), op, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:412:40: warning: unused variable 'ScatterSchema' [-Wunused-variable] 412 | constexpr nvtxPayloadSchemaEntry_t ScatterSchema[] = { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:418:23: warning: unused variable 'payload' [-Wunused-variable] 418 | NvtxParamsScatter payload{recvcount * ncclTypeSize(datatype), root, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:461:22: warning: unused variable 'payload' [-Wunused-variable] 461 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:486:22: warning: unused variable 'payload' [-Wunused-variable] 486 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer, datatype}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:10: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, iIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] nt* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:10: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclRewarning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncsult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] clTopoDe/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:93:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 93 | constexpr nvtxPayloadSchemaEntry_t AllGathvToRank(struct ncclTopoSystem* system, int d e249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:448:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 448 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ v, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249erSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:98:23: warning: unused variable 'payload' [-Wunused-variable] 98 | NvtxParam | stasAllGather payload{sendcount * ncclTypeSize(datatype), datatype}; | ^~~~~~~ tic ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:126:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 126 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:132:23: warning: unused variable 'payload' [-Wunused-variable] 132 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op, datatype}; | ^~~~~~~ float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:448:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 448 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:10: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:448:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 448 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc ^~~~~:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h :10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:In file included from 38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | st/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.ccatic :long 10log2i: (long /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.hn) { | ^~~~~: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:21510: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215::21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 21 215 | sta:tic ncclResult_t ncclTopoIdToInd/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:161:38: warning: unused variable 'AllToAllSchema' [-Wunused-variable] 161 | constexpr nvtxPayloadSchemaEntry_t AllToAllSchema[] = { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:166:22: warning: unused variable 'payload' [-Wunused-variable] 166 | NvtxParamsAllToAll payload{count * ncclTypeSize(datatype), datatype}; | ^~~~~~~ ex(struct ncclTopoSystem* system, int type, int64_t idIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:10: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: , int* in warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, intunused function 'ncclTopoXGMISpeed' [-Wunused-function]* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTodex) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:448:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 448 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ _t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncpoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] clTopoSy249stem | * sysstemt, inat devt, init* rcank) { | n ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.hc:249:21c: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | statilResult_t n/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:212:38: warning: unused variable 'AllToAllvSchema' [-Wunused-variable] 212 | constexpr nvtxPayloadSchemaEntry_t AllToAllvSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:219:23: warning: unused variable 'payload' [-Wunused-variable] 219 | NvtxParamsAllToAllv payload{sendcounts[comm->rank] * ncclTypeSize(datatype), recvcounts[comm->rank] * ncclTypeSize(datatype), datatype}; | ^~~~~~~ cclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static c float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | statfloat ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:261:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 261 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:267:23: warning: unused variable 'payload' [-Wunused-variable] 267 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root, datatype}; | ^~~~~~~ ) { ic | int ^~~~~~mi rror/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.hBits(int :val,286 in:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cct pow2) {: | ^~~~~~~~~~448 /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc::448:42:42 warning: unused variable 'SendRecvSchema' [-Wunused-const-variable]: 448 | conswarning: texpunused variable 'SendRecvSchema' [-Wunused-const-variable]r co nst nvtxPa448yloa | dScchemaEontryn_t SsendRtecvexpr Schema[] = { | ^~~~~~~~~~~~~~ const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:10: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:448:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 448 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:301:40: warning: unused variable 'GatherSchema' [-Wunused-variable] 301 | constexpr nvtxPayloadSchemaEntry_t GatherSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:307:22: warning: unused variable 'payload' [-Wunused-variable] 307 | NvtxParamsGather payload{sendcount * ncclTypeSize(datatype), root, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:343:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 343 | constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:351:20: warning: unused variable 'payload' [-Wunused-variable] 351 | NvtxParamsReduce payload{count * ncclTypeSize(datatype), root, op, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:378:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 378 | constexpr nvtxPayloadSchemaEntry_t ReduceScatterSchema[] = { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:385:27: warning: unused variable 'payload' [-Wunused-variable] 385 | NvtxParamsReduceScatter payload{recvcount * ncclTypeSize(datatype), op, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:412:40: warning: unused variable 'ScatterSchema' [-Wunused-variable] 412 | constexpr nvtxPayloadSchemaEntry_t ScatterSchIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:10: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:448:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 448 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ ema[] = { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:418:23: warning: unused variable 'payload' [-Wunused-variable] 418 | NvtxParamsScatter payload{recvcount * ncclTypeSize(datatype), root, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:461:22: warning: unused variable 'payload' [-Wunused-variable] 461 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer, datatype}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:486:22: warning: unused variable 'payload' [-Wunused-variable] 486 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer, datatype}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:10: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:448:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 448 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:10: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/collectives.cc:448:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 448 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/debug.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/debug.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 31 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/debug.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/debug.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/debug.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 31In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/debug.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ warnings31 generated when compiling for gfx942. In file included from warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/debug.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 31 warnings generated when compiling for gfx906. 31 warnings generated when compiling for gfx1030. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/debug.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 31 warnings generated when compiling for gfx1101. 31 warnings generated when compiling for gfx908. 31 warnings generated when compiling for gfx1200. 31 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/debug.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/debug.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 31 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/debug.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 31 warnings generated when compiling for gfx1100. 1 warning generated when compiling for host. 1 warning generated when compiling for gfx1101. 1 warning generated when compiling for gfx1200. 1 warning generated when compiling for gfx942. [ 45%] Building CXX object CMakeFiles/rccl.dir/hipify/src/enqueue.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/enqueue.cc.o -MF CMakeFiles/rccl.dir/hipify/src/enqueue.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/enqueue.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc 1 warning generated when compiling for gfx1100. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx1201. 1 warning generated when compiling for gfx1102. 1 warning generated when compiling for gfx906. 1 warning generated when compiling for gfx1030. 1 warning generated when compiling for gfx908. [ 45%] Building CXX object CMakeFiles/rccl.dir/hipify/src/group.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/group.cc.o -MF CMakeFiles/rccl.dir/hipify/src/group.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/group.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/group.cc In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/enqueue.h:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/group.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/group.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/group.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/group.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/group.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/group.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/group.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/group.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/group.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/group.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/group.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/group.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/group.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/group.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/group.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/group.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/group.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/group.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/group.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/group.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/group.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/group.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx942. 2 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:16: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ 2 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:16: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | v2 warnings generated when compiling for gfx1030. oid *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md In file included from =/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:16: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ (gdr_mem_desc_t*)gdrHandle; | ^~ 2 warnings generated when compiling for gfx90a. 2 warnings generated when compiling for gfx1102. 2 warnings generated when compiling for gfx1100. 2 warnings generated when compiling for gfx908. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:72:5: warning: unused label 'ignore0' [-Wunused-label] 72 | ignore0:; | ^~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:16: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:16: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:16: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ 2/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ warnings generated when compiling for gfx906. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:72:5: warning: unused label 'ignore0' [-Wunused-label] 72 | ignore0:; | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:72:5: warning: unused label 'ignore0' [-Wunused-label] 72 | ignore0:; | ^~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:16: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:16: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ 2 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:16: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:72:5: warning: unused label 'ignore0' [-Wunused-label] 72 | ignore0:; | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:72:5: warning: unused label 'ignore0' [-Wunused-label] 72 | ignore0:; | ^~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:16: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:72:5: warning: unused label 'ignore0' [-Wunused-label] 72 | ignore0:; | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:72:5: warning: unused label 'ignore0' [-Wunused-label] 72 | ignore0:; | ^~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:16: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ [ 46%] Building CXX object CMakeFiles/rccl.dir/hipify/src/init.cc.o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc/usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/init.cc.o -MF CMakeFiles/rccl.dir/hipify/src/init.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/init.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc :72:5: warning: unused label 'ignore0' [-Wunused-label] 72 | ignore0:; | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:72:5: warning: unused label 'ignore0' [-Wunused-label] 72 | ignore0:; | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:72:5: warning: unused label 'ignore0' [-Wunused-label] 72 | ignore0:; | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:72:5: warning: unused label 'ignore0' [-Wunused-label] 72 | ignore0:; | ^~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:12: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:16: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:224:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 224 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:103:22: warning: unused function 'ncclFuncSendCount' [-Wunused-function] 103 | static inline size_t ncclFuncSendCount(ncclFunc_t func, int nRanks, size_t count) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:106:22: warning: unused function 'ncclFuncRecvCount' [-Wunused-function] 106 | static inline size_t ncclFuncRecvCount(ncclFunc_t func, int nRanks, size_t count) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:274:21: warning: unused function 'cleanupIpc' [-Wunused-function] 274 | static ncclResult_t cleanupIpc(struct ncclComm* comm, struct ncclCommCallback* cb) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:1069:12: warning: unused function 'calcP2pChannelCount' [-Wunused-function] 1069 | static int calcP2pChannelCount(size_t totalSize, int minChannels, int maxChannels, size_t minSize, size_t maxSize) { | ^~~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:12: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:12: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:16:20: devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclColwarning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct nccllNet-C>getProopertiesm(dev, prmops)); *return nc clSuccess; } | c ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19o:21: warning: unused function 'collNetListen' [-Wunused-function] m19 | stamtic ncc,lResult _t colliNetListnen(structt nccl* nComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(dev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetPropecomm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, irties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collntN ranke, voitd* liLstenCiomm, svoid*t* colleComm)n { NC(CLCHEsCK(cotmm->ncrclColulNet-c>conntect(h andlens, nracnksclComm* comm, int dev, voi, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | statd* hiandlec, voi ncclRd** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclesSult_tu collcNetRecduceSeupposrt(strsuct ;ncclCo mm* }comm, nc | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | sclDtataTaypetic ncclResult_t collNet_t CdataToype, nncclRnedOp_te rcedOp,t int*( supsptruct nccorted) { NCCLCHECK(comm->ncclCollNet->relComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(sduceSupport(dataTypet,ruct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, dat redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(star, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); retuuct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; }r n ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetClo | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t siszeColl(struct ncclComm*e, int type, comm,u void* collComm) { NCCLCHECK(commint64_t offset, in->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupportt fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDma(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(strucBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, vto ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGid* collComm, void* mMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool ihandle) { NCCLsPow2(int val) CHE{ | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:16: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:224:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 224 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:103:22: warning: unused function 'ncclFuncSendCount' [-Wunused-function] 103 | static inline size_t ncclFuncSendCount(ncclFunc_t func, int nRanks, size_t count) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:106:22: warning: unused function 'ncclFuncRecvCount' [-Wunused-function] 106 | static inline size_t ncclFuncRecvCount(ncclFunc_t func, int nRanks, size_t count) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:274:21: warning: unused function 'cleanupIpc' [-Wunused-function] 274 | static ncclResult_t cleanupIpc(struct ncclComm* comm, struct ncclCommCallback* cb) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:1069:12: warning: unused function 'calcP2pChannelCount' [-Wunused-function] 1069 | static int calcP2pChannelCount(size_t totalSize, int minChannels, int maxChannels, size_t minSize, size_t maxSize) { | ^~~~~~~~~~~~~~~~~~~ CK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:16: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:224:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 224 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:103:22: warning: unused function 'ncclFuncSendCount' [-Wunused-function] 103 | static inline size_t ncclFuncSendCount(ncclFunc_t func, int nRanks, size_t count) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:106:22: warning: unused function 'ncclFuncRecvCount' [-Wunused-function] 106 | static inline size_t ncclFuncRecvCount(ncclFunc_t func, int nRanks, size_t count) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:274:21: warning: unused function 'cleanupIpc' [-Wunused-function] 274 | static ncclResult_t cleanupIpc(struct ncclComm* comm, struct ncclCommCallback* cb) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:1069:12: warning: unused function 'calcP2pChannelCount' [-Wunused-function] 1069 | static int calcP2pChannelCount(size_t totalSize, int minChannels, int maxChannels, size_t minSize, size_t maxSize) { | ^~~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:12: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:16: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:224:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 224 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:103:22: warning: unused function 'ncclFuncSendCount' [-Wunused-function] 103 | static inline size_t ncclFuncSendCount(ncclFunc_t func, int nRanks, size_t count) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:106:22: warning: unused function 'ncclFuncRecvCount' [-Wunused-function] 106 | static inline size_t ncclFuncRecvCount(ncclFunc_t func, int nRanks, size_t count) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:274:21: warning: unused function 'cleanupIpc' [-Wunused-function] 274 | static ncclResult_t cleanupIpc(struct ncclComm* comm, struct ncclCommCallback* cb) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:1069:12: warning: unused function 'calcP2pChannelCount' [-Wunused-function] 1069 | static int calcP2pChannelCount(size_t totalSize, int minChannels, int maxChannels, size_t minSize, size_t maxSize) { | ^~~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:12: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHEIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:12: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, iCK(comm->ncclColnt* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->nclNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* commc,lCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCol l{ NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); retuNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclrn ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccesComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(devs; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncc, handle, listenComm)); return nlTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:16: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:224:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 224 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:103:22: warning: unused function 'ncclFuncSendCount' [-Wunused-function] 103 | static inline size_t ncclFuncSendCount(ncclFunc_t func, int nRanks, size_t count) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:106:22: warning: unused function 'ncclFuncRecvCount' [-Wunused-function] 106 | static inline size_t ncclFuncRecvCount(ncclFunc_t func, int nRanks, size_t count) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:274:21: warning: unused function 'cleanupIpc' [-Wunused-function] 274 | static ncclResult_t cleanupIpc(struct ncclComm* comm, struct ncclCommCallback* cb) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:1069:12: warning: unused function 'calcP2pChannelCount' [-Wunused-function] 1069 | static int calcP2pChannelCount(size_t totalSize, int minChannels, int maxChannels, size_t minSize, size_t maxSize) { | ^~~~~~~~~~~~~~~~~~~ cclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, voIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:12: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] id* data, size_t size, int type, uint64_t offset, int fd, void** 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDereg, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t sizeMr(struct ncc,l int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t siComm* comm, void* collComm, void* mhandle) { NCCze, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, LCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sveoid* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comndData, void* recvData, int count, ncclDataType_t dataTypem, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct nccl, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, TvopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:16: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:224:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 224 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:103:22: warning: unused function 'ncclFuncSendCount' [-Wunused-function] 103 | static inline size_t ncclFuncSendCount(ncclFunc_t func, int nRanks, size_t count) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:106:22: warning: unused function 'ncclFuncRecvCount' [-Wunused-function] 106 | static inline size_t ncclFuncRecvCount(ncclFunc_t func, int nRanks, size_t count) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:274:21: warning: unused function 'cleanupIpc' [-Wunused-function] 274 | static ncclResult_t cleanupIpc(struct ncclComm* comm, struct ncclCommCallback* cb) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:1069:12: warning: unused function 'calcP2pChannelCount' [-Wunused-function] 1069 | static int calcP2pChannelCount(size_t totalSize, int minChannels, int maxChannels, size_t minSize, size_t maxSize) { | ^~~~~~~~~~~~~~~~~~~ oid** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:16: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:224:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 224 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:103:22: warning: unused function 'ncclFuncSendCount' [-Wunused-function] 103 | static inline size_t ncclFuncSendCount(ncclFunc_t func, int nRanks, size_t count) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:106:22: warning: unused function 'ncclFuncRecvCount' [-Wunused-function] 106 | static inline size_t ncclFuncRecvCount(ncclFunc_t func, int nRanks, size_t count) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:274:21: warning: unused function 'cleanupIpc' [-Wunused-function] 274 | static ncclResult_t cleanupIpc(struct ncclComm* comm, struct ncclCommCallback* cb) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:1069:12: warning: unused function 'calcP2pChannelCount' [-Wunused-function] 1069 | static int calcP2pChannelCount(size_t totalSize, int minChannels, int maxChannels, size_t minSize, size_t maxSize) { | ^~~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:12: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:16: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:224:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 224 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:103:22: warning: unused function 'ncclFuncSendCount' [-Wunused-function] 103 | static inline size_t ncclFuncSendCount(ncclFunc_t func, int nRanks, size_t count) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:106:22: warning: unused function 'ncclFuncRecvCount' [-Wunused-function] 106 | static inline size_t ncclFuncRecvCount(ncclFunc_t func, int nRanks, size_t count) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:274:21: warning: unused function 'cleanupIpc' [-Wunused-function] 274 | static ncclResult_t cleanupIpc(struct ncclComm* comm, struct ncclCommCallback* cb) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:1069:12: warning: unused function 'calcP2pChannelCount' [-Wunused-function] 1069 | static int calcP2pChannelCount(size_t totalSize, int minChannels, int maxChannels, size_t minSize, size_t maxSize) { | ^~~~~~~~~~~~~~~~~~~ 35 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:12: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:16: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:224:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 224 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:103:22: warning: unused function 'ncclFuncSendCount' [-Wunused-function] 103 | static inline size_t ncclFuncSendCount(ncclFunc_t func, int nRanks, size_t count) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:106:22: warning: unused function 'ncclFuncRecvCount' [-Wunused-function] 106 | static inline size_t ncclFuncRecvCount(ncclFunc_t func, int nRanks, size_t count) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:274:21: warning: unused function 'cleanupIpc' [-Wunused-function] 274 | static ncclResult_t cleanupIpc(struct ncclComm* comm, struct ncclCommCallback* cb) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:1069:12: warning: unused function 'calcP2pChannelCount' [-Wunused-function] 1069 | static int calcP2pChannelCount(size_t totalSize, int minChannels, int maxChannels, size_t minSize, size_t maxSize) { | ^~~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:12: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet-In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:12: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const c>reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_htar* co llNetNcame(strouct nlcclComlNetmR* comme) {gMr(struct ncclC roeturn mcomm->mnc* comm, void* collComm, void* data, size_t clCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mcomhm->nacclCnollNdet->dlevicees(n)dev))); re;turn nccrlSucecesst; } u | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.hr:n ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:2418::21: warning: 21unused function 'collNetGetProperties' [-Wunused-function] :18 | s twarning: aticunused function 'collNetRegMrDmaBuf' [-Wunused-function] ncc lResul t_t co24 | llsNetatic ncclResult_t collNettGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fCdHECK,(com m->nvcclCoollNeti->gedtPro*pert*ies( dev,m prohps))a; renturnd nccllSucceess;) } | ^~~~~~~~~~~~~~~~~~~~ { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, da/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, voitda, s*ize,* type , offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_listtenC omm)c { NoCCLClHECKl(comNm->nceclColtlNetD->elistren(edev,g handMle,r(struct listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NncclComm* comm, void* colCCLCHEClK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclReComm, void* mhandle) { NCCLCHECK(comm->sult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm,ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclR void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopesult_t collNetTest(struct ncclComm* comm, void* request, intoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:16: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:224:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 224 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:103:22: warning: unused function 'ncclFuncSendCount' [-Wunused-function] 103 | static inline size_t ncclFuncSendCount(ncclFunc_t func, int nRanks, size_t count) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:106:22: warning: unused function 'ncclFuncRecvCount' [-Wunused-function] 106 | static inline size_t ncclFuncRecvCount(ncclFunc_t func, int nRanks, size_t count) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:274:21: warning: unused function 'cleanupIpc' [-Wunused-function] 274 | static ncclResult_t cleanupIpc(struct ncclComm* comm, struct ncclCommCallback* cb) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:1069:12: warning: unused function 'calcP2pChannelCount' [-Wunused-function] 1069 | static int calcP2* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHpChannelCount(size_t totalSize, int minChannels, int maxChannels, size_t minSize, size_t maxSize) { | ^~~~~~~~~~~~~~~~~~~ ECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:16: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:224:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 224 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:103:22: warning: unused function 'ncclFuncSendCount' [-Wunused-function] 103 | static inline size_t ncclFuncSendCount(ncclFunc_t func, int nRanks, size_t count) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:106:22: warning: unused function 'ncclFuncRecvCount' [-Wunused-function] 106 | static inline size_t ncclFuncRecvCount(ncclFunc_t func, int nRanks, size_t count) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:274:21: warning: unused function 'cleanupIpc' [-Wunused-function] 274 | static ncclResult_t cleanupIpc(struct ncclComm* comm, struct ncclCommCallback* cb) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/enqueue.cc:1069:12: warning: unused function 'calcP2pChannelCount' [-Wunused-function] 1069 | static int calcP2pChannelCount(size_t totalSize, int minChannels, int maxChannels, size_t minSize, size_t maxSize) { | ^~~~~~~~~~~~~~~~~~~ 35 warnings generated when compiling for gfx90a. 35 warnings generated when compiling for gfx942. 35 warnings generated when compiling for gfx1101. 35 warnings generated when compiling for gfx1200. 35 warnings generated when compiling for gfx1201. 35 warnings generated when compiling for gfx1100. 35 warnings generated when compiling for gfx1030. 35 warnings generated when compiling for gfx1102. 35 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 35 warnings generated when compiling for host. [ 46%] Building CXX object CMakeFiles/rccl.dir/hipify/src/init_nvtx.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/init_nvtx.cc.o -MF CMakeFiles/rccl.dir/hipify/src/init_nvtx.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/init_nvtx.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init_nvtx.cc In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:1857:11: warning: unused variable 'stackSize' [-Wunused-variable] 1857 | int64_t stackSize; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:1858:19: warning: unused variable 'devProp' [-Wunused-variable] 1858 | hipDeviceProp_t devProp; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:1857:11: warning: unused variable 'stackSize' [-Wunused-variable] 1857 | int64_t stackSize; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:1858:19: warning: unused variable 'devProp' [-Wunused-variable] 1858 | hipDeviceProp_t devProp; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:1857:11: warning: unused variable 'stackSize' [-Wunused-variable] 1857 | int64_t stackSize; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:1858:19: warning: unused variable 'devProp' [-Wunused-variable] 1858 | hipDeviceProp_t devProp; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:1857:11: warning: unused variable 'stackSize' [-Wunused-variable] 1857 | int64_t stackSize; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:1858:19: warning: unused variable 'devProp' [-Wunused-variable] 1858 | hipDeviceProp_t devProp; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2264:26: warning: unused variable 'payload' [-Wunused-variable] 2264 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:1857:11: warning: unused variable 'stackSize' [-Wunused-variable] 1857 | int64_t stackSize; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:1858:19: warning: unused variable 'devProp' [-Wunused-variable] 1858 | hipDeviceProp_t devProp; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2264:26: warning: unused variable 'payload' [-Wunused-variable] 2264 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2278:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2278 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2278:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2278 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2264:26: warning: unused variable 'payload' [-Wunused-variable]/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc :2264:26: warning: unused variable 'payload' [-Wunused-variable] 2264 2264 | | NvtxParamsCommInitRank payload{my NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ rank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2278:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2278 | constexpr nvtxPayl:2278:38o: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2278 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ adSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2264:26: warning: unused variable 'payload' [-Wunused-variable] 2264 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2563:26: warning: unused variable 'payload' [-Wunused-variable] 2563 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2598:26: warning: unused variable 'payload' [-Wunused-variable] 2598 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2278:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2278 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2563:26: warning: unused variable 'payload' [-Wunused-variable] 2563 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2598:26: warning: unused variable 'payload' [-Wunused-variable] 2598 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2563:26: warning: unused variable 'payload' [-Wunused-variable] 2563 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2563:26: warning: unused variable 'payload' [-Wunused-variable] 2563 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ :2598:26: warning: unused variable 'payload' [-Wunused-variable] 2598 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2598:26: warning: unused variable 'payload' [-Wunused-variable] 2598 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:1857:11: warning: unused variable 'stackSize' [-Wunused-variable] 1857 | int64_t stackSize; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:1858:19: warning: unused variable 'devProp' [-Wunused-variable] 1858 | hipDeviceProp_t devProp; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:1857:11: warning: unused variable 'stackSize' [-Wunused-variable] 1857 | int64_t stackSize; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:1858:19: warning: unused variable 'devProp' [-Wunused-variable] 1858 | hipDeviceProp_t devProp; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2563:26: warning: unused variable 'payload' [-Wunused-variable] 2563 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2598:26: warning: unused variable 'payload' [-Wunused-variable] 2598 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:1857:11: warning: unused variable 'stackSize' [-Wunused-variable] 1857 | int64_t stackSize; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:1858:19: warning: unused variable 'devProp' [-Wunused-variable] 1858 | hipDeviceProp_t devProp; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:1857:11: warning: unused variable 'stackSize' [-Wunused-variable] 1857 | int64_t stackSize; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:1858:19: warning: unused variable 'devProp' [-Wunused-variable] 1858 | hipDeviceProp_t devProp; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2264:26: warning: unused variable 'payload' [-Wunused-variable] 2264 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2264:26: warning: unused variable 'payload' [-Wunused-variable] 2264 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2278:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2278 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2278:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2278 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2264:26: warning: unused variable 'payload' [-Wunused-variable] 2264 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:1857:11: warning: unused variable 'stackSize' [-Wunused-variable] 1857 | int64_t stackSize; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:1858:19: warning: unused variable 'devProp' [-Wunused-variable] 1858 | hipDeviceProp_t devProp; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2278:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2278 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2264:26: warning: unused variable 'payload' [-Wunused-variable] 2264 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:1857:11: warning: unused variable 'stackSize' [-Wunused-variable] 1857 | int64_t stackSize; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:1858:19: warning: unused variable 'devProp' [-Wunused-variable] 1858 | hipDeviceProp_t devProp; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2264:26: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2278:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2278 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ warning: unused variable 'payload' [-Wunused-variable] 2264 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2563:26: warning: unused variable 'payload' [-Wunused-variable] 2563 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2563:26: warning: unused variable 'payload' [-Wunused-variable] 2563 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2598:26: warning: unused variable 'payload' [-Wunused-variable] 2598 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2598:26: warning: unused variable 'payload' [-Wunused-variable] 2598 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ :2278:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2278 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2563:26: warning: unused variable 'payload' [-Wunused-variable] 2563 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2598:26: warning: unused variable 'payload' [-Wunused-variable] 2598 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2264:26: warning: unused variable 'payload' [-Wunused-variable] 2264 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2278:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2278 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ :2563:26: warning: unused variable 'payload' [-Wunused-variable] 2563 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2598:26: warning: unused variable 'payload' [-Wunused-variable] 2598 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2563:26: warning: unused variable 'payload' [-Wunused-variable] 2563 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2598:26: warning: unused variable 'payload' [-Wunused-variable] 2598 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:19: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHIn file included from EC/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:19: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCIn file included from ollNet->listen(dev, ahtaandlType_t dataType, nccle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:19: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm*** mhandle) { NCCLCHECK(comm->ncclCollNetRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:39: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function]->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21 comm, :void* c ollComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ warning: unused function 'collNetDeregMr' [-Wunused-function]/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 25 | static n29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ cclResult_t colIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:19: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:39: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:40: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNo 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:40: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2563:26: warning: unused variable 'payload' [-Wunused-variable] 2563 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ lNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollN e16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECKt->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet-des) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(str char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:86:21: warning: unused function 'commReclaim' [-Wunused-function] 86 | static ncclResult_t commReclaim(ncclComm_t comm); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2249:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 2249 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ (comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct uct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2598:26: warning: unused variable 'payload' [-Wunused-variable] 2598 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ >closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:39: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:40: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclR | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:86:21: warning: unused function 'commReclaim' [-Wunused-function] 86 | static ncclResult_t commReclaim(ncclComm_t comm); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2249:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 2249 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm))e; return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:39: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, insult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~t dev, int* rank) /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h: { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToIn tfloat ncclT(opoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ con/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:40: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float st char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:86:21: warning: unused function 'commReclaim' [-Wunused-function] 86 | static ncclResult_t commReclaim(ncclComm_t comm); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2249:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 2249 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:86:21: warning: unused function 'commReclaim' [-Wunused-function] 86 | static ncclResult_t commReclaim(ncclComm_t comm); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2249:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 2249 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:19: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:39: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:40: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:86:21: warning: unused function 'commReclaim' [-Wunused-function] 86 | static ncclResult_t commReclaim(ncclComm_t comm); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2249:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 2249 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:19: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; }In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:19: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(st | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* lruct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:39: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:40: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct nccIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from istenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:39: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:40: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSet/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:19: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->lXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* aAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:86:21: warning: unused function 'commReclaim' [-Wunused-function] 86 | static ncclResult_t commReclaim(ncclComm_t comm); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2249:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 2249 | constexpr nvtxPayloadSchemaEntry_t CommInitRankttrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct nSchema[] = { | ^~~~~~~~~~~~~~~~~~ cclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:86:21: warning: unused function 'commReclaim' [-Wunused-function] 86 | static ncclResult_t commReclaim(ncclComm_t comm); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2249:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 2249 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:39: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:40: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(strucIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:19: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* t nccoclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmmm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListelnNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] (334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:86:21: warning: unused function 'commReclaim' [-Wunused-function] 86 | static ncclResult_t commReclaim(ncclComm_t comm); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2249:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 2249 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:39: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:40: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, cIn file included from onst char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:86:21: warning: unused function 'commReclaim' [-Wunused-function] 86 | static ncclResult_t commReclaim(ncclComm_t com/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:19: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type,m); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2249:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 2249 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:39: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:40: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:86:21: warning: unused function 'commReclaim' [-Wunused-function] 86 | static ncclResult_t commReclaim(ncclComm_t comm); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2249:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 2249 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:19: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:39: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:40: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:86:21: warning: unused function 'commReclaim' [-Wunused-function] 86 | static ncclResult_t commReclaim(ncclComm_t comm); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init.cc:2249:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 2249 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ 57 warnings generated when compiling for gfx1101. 57 warnings generated when compiling for gfx1100. 57 warnings generated when compiling for gfx1201. 57 warnings generated when compiling for gfx906. 57 warnings generated when compiling for gfx1200. 57 warnings generated when compiling for gfx1030. 57 warnings generated when compiling for gfx908. 57 warnings generated when compiling for gfx1102. 57 warnings generated when compiling for gfx942. 57 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/nvtx.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init_nvtx.cc:4:42: warning: unused variable 'NvtxEnumRedSchema' [-Wunused-const-variable] 4 | static constexpr const nvtxPayloadEnum_t NvtxEnumRedSchema[] = { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init_nvtx.cc:4:42: warning: unused variable 'NvtxEnumRedSchema' [-Wunused-const-variable] 4 | static constexpr const nvtxPayloadEnum_t NvtxEnumRedSchema[] = { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init_nvtx.cc:4:42: warning: unused variable 'NvtxEnumRedSchema' [-Wunused-const-variable] 4 | static constexpr const nvtxPayloadEnum_t NvtxEnumRedSchema[] = { | ^~~~~~~~~~~~~~~~~ 2 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init_nvtx.cc:4:42: warning: unused variable 'NvtxEnumRedSchema' [-Wunused-const-variable] 4 | static constexpr const nvtxPayloadEnum_t NvtxEnumRedSchema[] = { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init_nvtx.cc:4:42: warning: unused variable 'NvtxEnumRedSchema' [-Wunused-const-variable] 4 | static constexpr const nvtxPayloadEnum_t NvtxEnumRedSchema[] = { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init_nvtx.cc:4:42: warning: unused variable 'NvtxEnumRedSchema' [-Wunused-const-variable] 4 | static constexpr const nvtxPayloadEnum_t NvtxEnumRedSchema[] = { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init_nvtx.cc:4:42: warning: unused variable 'NvtxEnumRedSchema' [-Wunused-const-variable] 4 | static constexpr const nvtxPayloadEnum_t NvtxEnumRedSchema[] = { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init_nvtx.cc:4:42: warning: unused variable 'NvtxEnumRedSchema' [-Wunused-const-variable] 4 | static constexpr const nvtxPayloadEnum_t NvtxEnumRedSchema[] = { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init_nvtx.cc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init_nvtx.cc:4:42: warning: unused variable 'NvtxEnumRedSchema' [-Wunused-const-variable] 4:4:42: warning: unused variable 'NvtxEnumRedSchema' [-Wunused-const-variable] 4 | static constexpr const nvtxPayloadEnum_t NvtxEnumRedSchema[] = { | ^~~~~~~~~~~~~~~~~ | static constexpr const nvtxPayloadEnum_t NvtxEnumRedSchema[] = { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/init_nvtx.cc:4:42: warning: unused variable 'NvtxEnumRedSchema' [-Wunused-const-variable] 4 | static constexpr const nvtxPayloadEnum_t NvtxEnumRedSchema[] = { | ^~~~~~~~~~~~~~~~~ 2 warnings generated when compiling for gfx906. 2 warnings generated when compiling for gfx1101. 2 warnings generated when compiling for gfx1102. 2 warnings generated when compiling for gfx90a. 2 warnings generated when compiling for gfx908. 2 warnings generated when compiling for gfx1200. 2 warnings generated when compiling for gfx1201. 2 warnings generated when compiling for gfx1030. 2 warnings generated when compiling for gfx942. 2 warnings generated when compiling for gfx1100. [ 46%] Building CXX object CMakeFiles/rccl.dir/hipify/src/net.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/net.cc.o -MF CMakeFiles/rccl.dir/hipify/src/net.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/net.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/net.cc 57 warnings generated when compiling for host. [ 46%] Building CXX object CMakeFiles/rccl.dir/hipify/src/msccl.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/msccl.cc.o -MF CMakeFiles/rccl.dir/hipify/src/msccl.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/msccl.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx1200. 2 warnings generated when compiling for host. 2 warnings generated when compiling for gfx942. 2 warnings generated when compiling for gfx1201. 2 warnings generated when compiling for gfx1030. 2 warnings generated when compiling for gfx1100. 2 warnings generated when compiling for gfx90a. 2 warnings generated when compiling for gfx906. 2 warnings generated when compiling for gfx908. 2 warnings generated when compiling for gfx1101. 2 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ [ 47%] Building CXX object CMakeFiles/rccl.dir/hipify/src/proxy.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/proxy.cc.o -MF CMakeFiles/rccl.dir/hipify/src/proxy.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/proxy.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/proxy.cc In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:54:38: warning: unused variable 'MscclSchema' [-Wunused-variable] 54 | constexpr nvtxPayloadSchemaEntry_t MscclSchema[] = { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:61:19: warning: unused variable 'payload' [-Wunused-variable] 61 | NvtxParamsMsccl payload{count * ncclTypeSize(dataType), op, dataType}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:54:38: warning: unused variable 'MscclSchema' [-Wunused-variable] 54 | constexpr nvtxPayloadSchemaEntry_t MscclSchema[] = { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:61:19: warning: unused variable 'payload' [-Wunused-variable] 61 | NvtxParamsMsccl payload{count * ncclTypeSize(dataType), op, dataType}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:54:38: warning: unused variable 'MscclSchema' [-Wunused-variable] 54 | constexpr nvtxPayloadSchemaEntry_t MscclSchema[] = { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:61:19: warning: unused variable 'payload' [-Wunused-variable] 61 | NvtxParamsMsccl payload{count * ncclTypeSize(dataType), op, dataType}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:54:38: warning: unused variable 'MscclSchema' [-Wunused-variable] 54 | constexpr nvtxPayloadSchemaEntry_t MscclSchema[] = { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:61:19: warning: unused variable 'payload' [-Wunused-variable] 61 | NvtxParamsMsccl payload{count * ncclTypeSize(dataType), op, dataType}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:54:38: warning: unused variable 'MscclSchema' [-Wunused-variable] 54 | constexpr nvtxPayloadSchemaEntry_t MscclSchema[] = { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:61:19: warning: unused variable 'payload' [-Wunused-variable] 61 | NvtxParamsMsccl payload{count * ncclTypeSize(dataType), op, dataType}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:54:38: warning: unused variable 'MscclSchema' [-Wunused-variable] 54 | constexpr nvtxPayloadSchemaEntry_t MscclSchema[] = { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:61:19: warning: unused variable 'payload' [-Wunused-variable] 61 | NvtxParamsMsccl payload{count * ncclTypeSize(dataType), op, dataType}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:7: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:54:38: warning: unused variable 'MscclSchema' [-Wunused-variable] 54 | constexpr nvtxPayloadSchemaEntry_t MscclSchema[] = { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:61:19: warning: unused variable 'payload' [-Wunused-variable] 61 | NvtxParamsMsccl payload{count * ncclTypeSize(dataType), op, dataType}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:54:38: warning: unused variable 'MscclSchema' [-Wunused-variable] 54 | constexpr nvtxPayloadSchemaEntry_t MscclSchema[] = { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:61:19: warning: unused variable 'payload' [-Wunused-variable] 61 | NvtxParamsMsccl payload{count * ncclTypeSize(dataType), op, dataType}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:54:38: warning: unused variable 'MscclSchema' [-Wunused-variable] 54 | constexpr nvtxPayloadSchemaEntry_t MscclSchema[] = { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:61:19: warning: unused variable 'payload' [-Wunused-variable] 61 | NvtxParamsMsccl payload{count * ncclTypeSize(dataType), op, dataType}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:54:38: warning: unused variable 'MscclSchema' [-Wunused-variable] 54 | constexpr nvtxPayloadSchemaEntry_t MscclSchema[] = { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:61:19: warning: unused variable 'payload' [-Wunused-variable] 61 | NvtxParamsMsccl payload{count * ncclTypeSize(dataType), op, dataType}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:54:38: warning: unused variable 'MscclSchema' [-Wunused-variable] 54 | constexpr nvtxPayloadSchemaEntry_t MscclSchema[] = { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:61:19: warning: unused variable 'payload' [-Wunused-variable] 61 | NvtxParamsMsccl payload{count * ncclTypeSize(dataType), op, dataType}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:7: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:7: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:7: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:7: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:7: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:7: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/enqueue.hIn file included from :10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:7: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:7: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xmIn file included from l, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:7: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/msccl.cc:7: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx1201. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx1200. 7 warnings generated when compiling for gfx942. 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx90a. 77 warnings generated when compiling for gfx908. warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx1101. [ 47%] Building CXX object CMakeFiles/rccl.dir/hipify/src/rccl_wrap.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/rccl_wrap.cc.o -MF CMakeFiles/rccl.dir/hipify/src/rccl_wrap.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/rccl_wrap.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/rccl_wrap.cc In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/proxy.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/proxy.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/proxy.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/proxy.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/proxy.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/proxy.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/proxy.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/proxy.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/proxy.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/proxy.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/proxy.cc:289:7: warning: variable 'sublist_len' set but not used [-Wunused-but-set-variable] 289 | int sublist_len = 0; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/proxy.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/proxy.cc:289:7: warning: variable 'sublist_len' set but not used [-Wunused-but-set-variable] 289 | int sublist_len = 0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/proxy.cc:289:7: warning: variable 'sublist_len' set but not used [-Wunused-but-set-variable] 289 | int sublist_len = 0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/proxy.cc:289:7: warning: variable 'sublist_len' set but not used [-Wunused-but-set-variable] 289 | int sublist_len = 0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/proxy.cc:289:7: warning: variable 'sublist_len' set but not used [-Wunused-but-set-variable] 289 | int sublist_len = 0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/proxy.cc:289:7: warning: variable 'sublist_len' set but not used [-Wunused-but-set-variable] 289 | int sublist_len = 0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/proxy.cc:289:7: warning: variable 'sublist_len' set but not used [-Wunused-but-set-variable] 289 | int sublist_len = 0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/proxy.cc:289:7: warning: variable 'sublist_len' set but not used [-Wunused-but-set-variable] 289 | int sublist_len = 0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/proxy.cc:289:7: warning: variable 'sublist_len' set but not used [-Wunused-but-set-variable] 289 | int sublist_len = 0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/proxy.cc:289:7: warning: variable 'sublist_len' set but not used [-Wunused-but-set-variable] 289 | int sublist_len = 0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/proxy.cc:289:7: warning: variable 'sublist_len' set but not used [-Wunused-but-set-variable] 289 | int sublist_len = 0; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/proxy.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/proxy.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/proxy.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/proxy.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/proxy.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/proxy.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/proxy.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/proxy.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/proxy.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/proxy.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/proxy.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 3 warnings generated when compiling for gfx942. 3 warnings generated when compiling for gfx1101. 3 warnings generated when compiling for gfx1030. 33 warnings generated when compiling for gfx1100. 3 warnings generated when compiling for gfx1102. 3 warnings generated when compiling for gfx1200. warnings generated when compiling for gfx906. 3 warnings generated when compiling for gfx1201. 3 warnings generated when compiling for gfx90a. 3 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/rccl_wrap.cc:25: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/rccl_wrap.cc:25: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/rccl_wrap.cc:25: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/rccl_wrap.cc:25: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/rccl_wrap.cc:25: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/rccl_wrap.cc:25: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/rccl_wrap.cc:25: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/rccl_wrap.cc:25: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/rccl_wrap.cc:25: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/rccl_wrap.cc:25: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/rccl_wrap.cc:25: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/rccl_wrap.cc:26: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/rccl_wrap.cc:26: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/rccl_wrap.cc:26: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/rccl_wrap.cc:26: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/rccl_wrap.cc:26: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ ex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/rccl_wrap.cc:26: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/rccl_wrap.cc:26: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/rccl_wrap.cc:26: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/rccl_wrap.cc:26: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/rccl_wrap.cc:26: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/rccl_wrap.cc:26: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ 9 warnings generated when compiling for host. 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx908. 9 warnings generated when compiling for gfx906. 9 warnings generated when compiling for gfx1030. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx942. [ 47%] Building CXX object CMakeFiles/rccl.dir/hipify/src/register.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/register.cc.o -MF CMakeFiles/rccl.dir/hipify/src/register.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/register.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/register.cc 3 warnings generated when compiling for host. [ 47%] Building CXX object CMakeFiles/rccl.dir/hipify/src/transport.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport.cc In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx1030. 2 warnings generated when compiling for gfx942. 2 warnings generated when compiling for gfx1101. 2 warnings generated when compiling for gfx1200. 2 warnings generated when compiling for gfx1101. 22 warnings generated when compiling for gfx90a. warnings generated when compiling for gfx1100. 2 warnings generated when compiling for gfx942. 2 warnings generated when compiling for gfx906. 2 warnings generated when compiling for gfx1200. 2 warnings generated when compiling for gfx1102. 2 warnings generated when compiling for gfx90a. 2 warnings generated when compiling for gfx1201. 2 warnings generated when compiling for gfx906. 2 warnings generated when compiling for gfx1201. 2 warnings generated when compiling for gfx908. 22 warnings generated when compiling for gfx1102. warnings generated when compiling for gfx1030. [ 48%] Building CXX object CMakeFiles/rccl.dir/hipify/src/device/common.cu.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/common.cu.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/common.cu.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/common.cu.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.cu.cpp 2 warnings generated when compiling for gfx1100. 2 warnings generated when compiling for host. [ 48%] Building CXX object CMakeFiles/rccl.dir/hipify/src/device/onerank.cu.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/onerank.cu.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/onerank.cu.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/onerank.cu.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/onerank.cu.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.cu.cpp:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.cu.cpp:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.cu.cpp:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.cu.cpp:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.cu.cpp:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.cu.cpp:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.cu.cpp:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.cu.cpp:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.cu.cpp:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.cu.cpp:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.cu.cpp:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/onerank.cu.cpp:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/onerank.cu.cpp:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/onerank.cu.cpp:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/onerank.cu.cpp:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 77 | uint32_t y, head, mantissa; | ^ :77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/onerank.cu.cpp:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/onerank.cu.cpp:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/onerank.cu.cpp:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/onerank.cu.cpp:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/onerank.cu.cpp:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/onerank.cu.cpp:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/onerank.cu.cpp:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 1 warning generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/onerank.cu.cpp:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/onerank.cu.cpp:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/onerank.cu.cpp:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/onerank.cu.cpp:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:In file included from 44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/onerank.cu.cpp:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/onerank.cu.cpp:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/onerank.cu.cpp:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/onerank.cu.cpp:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/onerank.cu.cpp:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/onerank.cu.cpp:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/onerank.cu.cpp:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx942. 1 warning generated when compiling for gfx1102. 1 warning generated when compiling for gfx1101. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx1201. 1 warning generated when compiling for gfx1030. 1 warning generated when compiling for gfx1100. 11 warning generated when compiling for gfx1200. warning generated when compiling for gfx942. 1 warning generated when compiling for gfx908. 1 warning generated when compiling for gfx906. 2 warnings generated when compiling for gfx908. [ 48%] Building CXX object CMakeFiles/rccl.dir/hipify/src/graph/connect.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/connect.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/connect.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/connect.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc 2 warnings generated when compiling for gfx90a. 2 warnings generated when compiling for gfx1201. 2 warnings generated when compiling for gfx1102. 2 warnings generated when compiling for gfx1101. 2 warnings generated when compiling for gfx906. 2 warnings generated when compiling for gfx1100. 2 warnings generated when compiling for gfx1030. 2 warnings generated when compiling for gfx1200. [ 48%] Building CXX object CMakeFiles/rccl.dir/hipify/src/graph/paths.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/paths.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/paths.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/paths.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:124:12: warning: unused variable 'y' [-Wunused-variable] 124 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:131:7: warning: unused variable 'localRanks' [-Wunused-variable] 131 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:124:12: warning: unused variable 'y' [-Wunused-variable] 124 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:131:7: warning: unused variable 'localRanks' [-Wunused-variable] 131 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:124:12: warning: unused variable 'y' [-Wunused-variable] 124 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:131:7: warning: unused variable 'localRanks' [-Wunused-variable] 131 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:124:12: warning: unused variable 'y' [-Wunused-variable] 124 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:131:7: warning: unused variable 'localRanks' [-Wunused-variable] 131 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:124:12: warning: unused variable 'y' [-Wunused-variable] 124 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:131:7: warning: unused variable 'localRanks' [-Wunused-variable] 131 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:265:21: warning: unused function 'getIndexes' [-Wunused-function] 265 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:439:21: warning: unused function 'connectNvls' [-Wunused-function] 439 | static ncclResult_t connectNvls(struct ncclComm* comm, int* nvlsHeads, int nHeads) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:124:12: warning: unused variable 'y' [-Wunused-variable] 124 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:131:7: warning: unused variable 'localRanks' [-Wunused-variable] 131 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ :124:12: warning: unused variable 'y' [-Wunused-variable] 124 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:131:7: warning: unused variable 'localRanks' [-Wunused-variable] 131 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:124:12: warning: unused variable 'y' [-Wunused-variable] 124 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:131:7: warning: unused variable 'localRanks' [-Wunused-variable] 131 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:124:12: warning: unused variable 'y' [-Wunused-variable] 124 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:131:7: warning: unused variable 'localRanks' [-Wunused-variable] 131 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:124:12: warning: unused variable 'y' [-Wunused-variable] 124 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:131:7: warning: unused variable 'localRanks' [-Wunused-variable] 131 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:124:12: warning: unused variable 'y' [-Wunused-variable] 124 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:131:7: warning: unused variable 'localRanks' [-Wunused-variable] 131 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:265:21: warning: unused function 'getIndexes' [-Wunused-function] 265 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:439:21: warning: unused function 'connectNvls' [-Wunused-function] 439 | static ncclResult_t connectNvls(struct ncclComm* comm, int* nvlsHeads, int nHeads) { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:265:21: warning: unused function 'getIndexes' [-Wunused-function] 265 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:439:21: warning: unused function 'connectNvls' [-Wunused-function] 439 | static ncclResult_t connectNvls(struct ncclComm* comm, int* nvlsHeads, int nHeads) { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:265:21: warning: unused function 'getIndexes' [-Wunused-function] 265 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:439:21: warning: unused function 'connectNvls' [-Wunused-function] 439 | static ncclResult_t connectNvls(struct ncclComm* comm, int* nvlsHeads, int nHeads) { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:265:21: warning: unused function 'getIndexes' [-Wunused-function] 265 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:439:21: warning: unused function 'connectNvls' [-Wunused-function] 439 | static ncclResult_t connectNvls(struct ncclComm* comm, int* nvlsHeads, int nHeads) { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:265:21: warning: unused function 'getIndexes' [-Wunused-function] 265 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:439:21: warning: unused function 'connectNvls' [-Wunused-function] 439 | static ncclResult_t connectNvls(struct ncclComm* comm, int* nvlsHeads, int nHeads) { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:265:21: warning: unused function 'getIndexes' [-Wunused-function] 265 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:439:21: warning: unused function 'connectNvls' [-Wunused-function] 439 | static ncclResult_t connectNvls(struct ncclComm* comm, int* nvlsHeads, int nHeads) { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:265:21: warning: unused function 'getIndexes' [-Wunused-function] 265 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:439:21: warning: unused function 'connectNvls' [-Wunused-function] 439 | static ncclResult_t connectNvls(struct ncclComm* comm, int* nvlsHeads, int nHeads) { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:265:21: warning: unused function 'getIndexes' [-Wunused-function] 265 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:439:21: warning: unused function 'connectNvls' [-Wunused-function] 439 | static ncclResult_t connectNvls(struct ncclComm* comm, int* nvlsHeads, int nHeads) { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | sta{ | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:265:21: warning: unused function 'getIndexes' [-Wunused-function] 265 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:439:21: warning: unused function 'connectNvls' [-Wunused-function] 439 | static ncclResult_t connectNvls(struct ncclComm* comm, int* nvlsHeads, int nHeads) { | ^~~~~~~~~~~ tic bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:265:21: warning: unused function 'getIndexes' [-Wunused-function] 265 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/connect.cc:439:21: warning: unused function 'connectNvls' [-Wunused-function] 439 | static ncclResult_t connectNvls(struct ncclComm* comm, int* nvlsHeads, int nHeads) { | ^~~~~~~~~~~ 13 warnings generated when compiling for gfx1100. 13 warnings generated when compiling for gfx906. 13 warnings generated when compiling for gfx1201. 13 warnings generated when compiling for gfx908. 13 warnings generated when compiling for gfx1101. 13 warnings generated when compiling for gfx942. 13 warnings generated when compiling for gfx1030. 13 warnings generated when compiling for gfx1200. 13 warnings generated when compiling for gfx1102. 13 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 13 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:275:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 275 | int intermediateIndex = -1; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:275:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 275 | int intermediateIndex = -1; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:275:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 275 | int intermediateIndex = -1; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:462:24: warning: unused variable 'gpu' [-Wunused-variable] 462 | struct ncclTopoNode* gpu = system->nodes[GPU].nodes+g; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:462:24: warning: unused variable 'gpu' [-Wunused-variable] 462 | struct ncclTopoNode* gpu = system->nodes[GPU].nodes+g; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:462:24: warning: unused variable 'gpu' [-Wunused-variable] 462 | struct ncclTopoNode* gpu = system->nodes[GPU].nodes+g; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ [ 49%] Building CXX object CMakeFiles/rccl.dir/hipify/src/graph/rings.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/rings.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/rings.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/rings.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rings.cc /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:275:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 275 | int intermediateIndex = -1; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:275:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 275 | int intermediateIndex = -1; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:462:24: warning: unused variable 'gpu' [-Wunused-variable] 462 | struct ncclTopoNode* gpu = system->nodes[GPU].nodes+g; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:462:24: warning: unused variable 'gpu' [-Wunused-variable] 462 | struct ncclTopoNode* gpu = system->nodes[GPU].nodes+g; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:275:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 275 | int intermediateIndex = -1; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:275:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 275 | int intermediateIndex = -1; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:11: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:17: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:11: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:17: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, c/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:462:24: warning: unused variable 'gpu' [-Wunused-variable] 462 | struct ncclTopoNode* gpu = system->nodes[GPU].nodes+g; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:11: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:17: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node,static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:462:24: warning: unused variable 'gpu' [-Wunused-variable] 462 | struct ncclTopoNode* gpu = system->nodes[GPU].nodes+g; | ^~~ onst int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:275:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 275 | int intermediateIndex = -1; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:462:24: warning: unused variable 'gpu' [-Wunused-variable] 462 | struct ncclTopoNode* gpu = system->nodes[GPU].nodes+g; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:275:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 275 | int intermediateIndex = -1; | ^ :275:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 275 | int intermediateIndex = -1; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:275:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 275 | int intermediateIndex = -1; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:462:24: warning: unused variable 'gpu' [-Wunused-variable] 462 | struct ncclTopoNode* gpu = system->nodes[GPU].nodes+g; | ^~~ :462:24: warning: unused variable 'gpu' [-Wunused-variable] 462 | struct ncclTopoNode* gpu = system->nodes[GPU].nodes+g; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:462:24: warning: unused variable 'gpu' [-Wunused-variable] 462 | struct ncclTopoNode* gpu = system->nodes[GPU].nodes+g; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:11: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:17: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:11: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:17: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:11: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:17: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:11: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:17: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXml254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ Node** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:11: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:17: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:11: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:17: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:11: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:17: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:11: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/paths.cc:17: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 31 warnings generated when compiling for gfx1100. 31 warnings generated when compiling for gfx90a. 31 warnings generated when compiling for gfx1201. 31 warnings generated when compiling for gfx1030. 31 warnings generated when compiling for gfx906. 31 warnings generated when compiling for gfx942. 31 warnings generated when compiling for gfx1101. 31 warnings generated when compiling for gfx908. 31 warnings generated when compiling for gfx1102. 31 warnings generated when compiling for gfx1200. 31 warnings generated when compiling for host. [ 49%] Building CXX object CMakeFiles/rccl.dir/hipify/src/graph/rome_models.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/rome_models.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/rome_models.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/rome_models.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rings.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rings.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rings.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rings.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rings.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rings.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rings.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rings.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rings.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rings.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rings.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx908. 1 warning generated when compiling for gfx1201. 1 warning generated when compiling for gfx906. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx1101. 1 warning generated when compiling for gfx942. 1 warning generated when compiling for gfx1100. 1 warning generated when compiling for gfx1030. 1 warning generated when compiling for gfx1102. 1 warning generated when compiling for gfx1200. [ 49%] Building CXX object CMakeFiles/rccl.dir/hipify/src/graph/search.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/search.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/search.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/search.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:24: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:24: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:24: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:24: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:24: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:24: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:24: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:24: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:24: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:24: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:24: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1341:7: warning: unused variable 'nChannels' [-Wunused-variable] 1341 | int nChannels = 0; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1351:12: warning: unused variable 'y' [-Wunused-variable] 1351 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1341:7: warning: unused variable 'nChannels' [-Wunused-variable] 1341 | int nChannels = 0; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1351:12: warning: unused variable 'y' [-Wunused-variable] 1351 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1341:7: warning: unused variable 'nChannels' [-Wunused-variable] 1341 | int nChannels = 0; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1351:12: warning: unused variable 'y' [-Wunused-variable] 1351 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1341:7: warning: unused variable 'nChannels' [-Wunused-variable] 1341 | int nChannels = 0; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1351:12: warning: unused variable 'y' [-Wunused-variable] 1351 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1858:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1858 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1930:9: warning: unused variable 't' [-Wunused-variable] 1930 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1858:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1858 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1930:9: warning: unused variable 't' [-Wunused-variable] 1930 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ :2036:7: warning: unused variable 'ncpus' [-Wunused-variable] 2036 | int ncpus = system->nodes[CPU].count; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:2130:9: warning: unused variable 't' [-Wunused-variable] 2130 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1858:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1858 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1930:9: warning: unused variable 't' [-Wunused-variable] 1930 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:2240:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 2240 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:2316:9: warning: unused variable 't' [-Wunused-variable] 2316 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1858:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1858 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1930:9: warning: unused variable 't' [-Wunused-variable] 1930 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:2036:7: warning: unused variable 'ncpus' [-Wunused-variable] 2036 | int ncpus = system->nodes[CPU].count; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:2130:9: warning: unused variable 't' [-Wunused-variable] 2130 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1341:7: warning: unused variable 'nChannels' [-Wunused-variable] 1341 | int nChannels = 0; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1351:12: warning: unused variable 'y' [-Wunused-variable] 1351 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:2240:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 2240 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:2316:9: warning: unused variable 't' [-Wunused-variable] 2316 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_us/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:2036:7: warning: unused variable 'ncpus' [-Wunused-variable] 2036 | int ncpus = system->nodes[CPU].count; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:2130:9: warning: unused variable 't' [-Wunused-variable] 2130 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:2036:7: warning: unused variable 'ncpus' [-Wunused-variable] 2036 | int ncpus = system->nodes[CPU].count; | ^~~~~ ec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:2130:9: warning: unused variable 't' [-Wunused-variable] 2130 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1341:7: warning: unused variable 'nChannels' [-Wunused-variable] 1341 | int nChannels = 0; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1351:12: warning: unused variable 'y' [-Wunused-variable] 1351 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:2240:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 2240 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:2316:9: warning: unused variable 't' [-Wunused-variable] 2316 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:2240:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 2240 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:2316:9: warning: unused variable 't' [-Wunused-variable] 2316 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1341:7: warning: unused variable 'nChannels' [-Wunused-variable] 1341 | int nChannels = 0; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1351:12: warning: unused variable 'y' [-Wunused-variable] 1351 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1341:7: warning: unused variable 'nChannels' [-Wunused-variable] 1341 | int nChannels = 0; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1351:12: warning: unused variable 'y' [-Wunused-variable] 1351 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1341:7: warning: unused variable 'nChannels' [-Wunused-variable] 1341 | int nChannels = 0; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1351:12: warning: unused variable 'y' [-Wunused-variable] 1351 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1858:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1858 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1930:9: warning: unused variable 't' [-Wunused-variable] 1930 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1341:7: warning: unused variable 'nChannels' [-Wunused-variable] 1341 | int nChannels = 0; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1351:12: warning: unused variable 'y' [-Wunused-variable] 1351 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1858:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1858 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1930:9: warning: unused variable 't' [-Wunused-variable] 1930 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv:2036:7: warning: unused variable 'ncpus' [-Wunused-variable] 2036 | int ncpus = system->nodes[CPU].count; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:2130:9: warning: unused variable 't' [-Wunused-variable] 2130 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ _usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1341:7: warning: unused variable 'nChannels' [-Wunused-variable] 1341 | int nChannels = 0; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1351:12: warning: unused variable 'y' [-Wunused-variable] 1351 | int x=0, y=0; | ^ :2240:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 2240 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:2316:9: warning: unused variable 't' [-Wunused-variable] 2316 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1858:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1858 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1930:9: warning: unused variable 't' [-Wunused-variable] 1930 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:2036:7: warning: unused variable 'ncpus' [-Wunused-variable] 2036 | int ncpus = system->nodes[CPU].count; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:2130:9: warning: unused variable 't' [-Wunused-variable] 2130 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1858:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1858 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1930:9: warning: unused variable 't' [-Wunused-variable] 1930 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ :2240:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 2240 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:2036:7: warning: unused variable 'ncpus' [-Wunused-variable] 2036 | int ncpus = system->nodes[CPU].count; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:2130:9: warning: unused variable 't' [-Wunused-variable] 2130 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:2316:9: warning: unused variable 't' [-Wunused-variable] 2316 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1858:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1858 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1930:9: warning: unused variable 't' [-Wunused-variable] 1930 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:2240:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 2240 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:2316:9: warning: unused variable 't' [-Wunused-variable] 2316 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:2036:7: warning: unused variable 'ncpus' [-Wunused-variable] 2036 | int ncpus = system->nodes[CPU].count; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:2130:9: warning: unused variable 't' [-Wunused-variable] 2130 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1858:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1858 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1930:9: warning: unused variable 't' [-Wunused-variable] 1930 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:2036:7: warning: unused variable 'ncpus' [-Wunused-variable] 2036 | int ncpus = system->nodes[CPU].count; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:2130:9: warning: unused variable 't' [-Wunused-variable] 2130 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:23: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:26: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:27: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode*/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:2240:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 2240 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:2316:9: warning: unused variable 't' [-Wunused-variable] 2316 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1858:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1858 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:1930:9: warning: unused variable 't' [-Wunused-variable] 1930 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:2240:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 2240 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:2316:9: warning: unused variable 't' [-Wunused-variable] 2316 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:2036:7: warning: unused variable 'ncpus' [-Wunused-variable] 2036 | int ncpus = system->nodes[CPU].count; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:2130:9: warning: unused variable 't' [-Wunused-variable] 2130 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:2036:7: warning: unused variable 'ncpus' [-Wunused-variable] 2036 | int ncpus = system->nodes[CPU].count; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:2130:9: warning: unused variable 't' [-Wunused-variable] 2130 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:23: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:26: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:27: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int:2240:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 2240 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:2316:9: warning: unused variable 't' [-Wunused-variable] 2316 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ * value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNodeIn file included from * /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.ccp:a23r: eIn file included from n/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.ht:N38o: dIn file included from e/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h,: 14s: t/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.hr:u44c:t13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:26: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:27: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDiIn file included from ct/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc*: 23d: iIn file included from c/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.ht:)38 : {In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h :| 14 ^~~~~~~~~~~~~~: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h44::13390:: 21warning: : unused function 'log2i' [-Wunused-function]warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | s t44a | tsitca tnicccl Rleosnugl tl_otg 2kiv(Cloonnvge rnt)T o{S t r| ( ^~~~~in t value, cIn file included from o/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.ccn:s26t: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.hc:h226a:r21*:* warning: sunused function 'ncclTopoRankToIndex' [-Wunused-function]t r, struct 226k | vDsitcatt*i cd incctc)l R{e s u| l ^~~~~~~~~~~~~~t _t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:27: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:2240:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 2240 | int g ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64cnt = 0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:2316:9: warning: unused variable 't' [-Wunused-variable] 2316 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ _t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:23: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:26: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:27: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:23: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:26: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:27: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResultIn file included from _t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:23: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:26: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | statIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:23: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:26: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:27: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclReic float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:27: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21:s ult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(structwarning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(s ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmltruct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNSoetAttrLong(struct ncclXmlNode* node, const char* atde* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | trName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, static ncclResult_t xmlGetAttrIntDefaulstruct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ t(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct nIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:23: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:26: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t icclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float*d, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:27: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNod) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ne* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclRecclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ sult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:23: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:26: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:27: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) In file included from { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclRes/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:23: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:26: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] u lt_t xmlS226etAt | trInst(sttructa ncctlXmliNodce* n ode,n concst cchar*lResult_t ncclTopoRankT attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResuloItndex_(t xmlSetAttrFstrulct nocclTaopoStyst(em* ssysttem, rint urankc, intt* in dex)ncclXmlNode* n{ o| ^~~~~~~~~~~~~~~~~~~ d/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.he:237:21,: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] c237 | statioc ncnst clResult_t ncclTopoDevToRank(struct ncclTopochSar*y atstrNtamee, cmons*t f loast vyastem, int dev,lue ) {i | n ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.ht:254:*21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] r 254a | stnatikc nc)clR esu{lt_ t x mlS| e ^~~~~~~~~~~~~~~~~ tAttrLong(s/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.ht:249:r21: uwarning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249ct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | st | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | satitc naccltResuilt_ct x mlUfnloat ncclTopoNVLinkBw(int cudaCompCap)setAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResul {t | _ ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.ht:283 :13:x warning: unused function 'isPow2' [-Wunused-function]m l283 | sGtateic tboolS isuPowb2(i(nt svalt) {r uct ncclXmlNode* node, const ch| a ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.hr:286*:12: warning: unused function 'mirrorBits' [-Wunused-function]s u286 | sbtatNic iant mmirero,rBi ts(sintt varluc, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/rome_models.cc:27: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml**t ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName xm,l, ints maxNodes)t { r | ^~~~~~~~ u/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21c: warning: tunused function 'xmlGetAttrInt' [-Wunused-function] 111 | static nnccclRecsullt_tX xmmllNode** sub, const char* attrNaGemtAtetrI,nt( stcrucotn nscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function]t int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct n 118 | static ncclResult_t xmlGetAttrInctclXml* dstDefault(struct , struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 38 warnings generated when compiling for gfx1101. 38 warnings generated when compiling for gfx1201. 38 warnings generated when compiling for gfx1100. 38 warnings generated when compiling for gfx1200. 38 warnings generated when compiling for gfx908. 38 warnings generated when compiling for gfx1102. 38 warnings generated when compiling for gfx942. 38 warnings generated when compiling for gfx906. 38 warnings generated when compiling for gfx90a. 38 warnings generated when compiling for gfx1030. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.hNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const :125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ char* subName, struct/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h :140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t x/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parentmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node,, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, constIn file included from char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc n:cc10lRe: suIn file included from lt_t x/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.hml:Fi13n: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.hd:No15de: (In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14st: r/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.huct: ncclXml44:13N: ode* parentNode, struct ncclXwarning: unused function 'log2i' [-Wunused-function]m l44 | Nsotadet*ic lsoneg log2ai(rlocnhg Nn) { o| ^~~~~d In file included from e,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc: 13s: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.ht:262ruc:t14 ncclXmlNode** no: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const cdeh) a{ | r ^~~~~~~~~~~* /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h :g216:c21:n warning: )unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | st{at ic n| cc ^~~~~~~~~~~~~~~~~lR es/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.hult_:t 272xm:lS14et:At trwarning: Ifunused function 'ncclTopoNVLinkBw' [-Wunused-function]Un se272t | (ssttartuicct fnlcocaltX mnlcNcoldTeo*p onNoVdLei,n kcBown(sitn tc hcaurd*a CaotmtprCNaapm)e ,{ c o| n ^~~~~~~~~~~~~~~~s t/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h ch:a283r:* v13a:l uwarning: eunused function 'isPow2' [-Wunused-function]) { 283 | | s ^~~~~~~~~~~~~~~~~t a/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.hti:267:c21 :b owarning: unused function 'xmlUnsetAttr' [-Wunused-function] ol267 | isstPaotw2i(c innctc lvRaels)u l{t _ t| ^~~~~~x m/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.hlUn:s286e:t12A: warning: unused function 'mirrorBits' [-Wunused-function]t t r(286 | sstrtuactti cn ccliXnmtlNo dmei*r rnoorBidtes,( icnonstt cvhaalr,* ianttt proNwa2m)e ){ { | ^~~~~~~~~~| ^~~~~~~~~~~~In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc::15279: :/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h21::118 :warning: 21unused function 'xmlGetSub' [-Wunused-function]: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function]279 | st118at | isct antcicclR enscuclltR_ets uxlmtl_Gte txSmulbG(esttArtutctrI nntcDcelfXamulNlto(dset* rnuocdte , cnocncsltX mclNohdaer* *n osduebN,a mceo,n sstt rcuhcatr *n cactltXrmNlaNmoed,e *i*n ts*u bva) {l u e| , ^~~~~~~~~ i/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.hnt: 305d:e21f:a uwarning: lunused function 'xmlGetSubKvInt' [-Wunused-function]t V alu305e | )s t{a t i| c ^~~~~~~~~~~~~~~~~~~~ n/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.hcc:125lRe:s21u:l twarning: _unused function 'xmlGetAttrLong' [-Wunused-function]t x125ml | GsettaStiucb KnvcIcnltR(essturlutc_tt nxcmcllGXemtlANtotdreL*o nngo(dset,r uccotn sntc cclhXamrl*N osdueb*N anmeo,d es,t rcuocnts tn ccchlaXrm*l Naotdter*N*a smueb,, i ncotn6s4t_ tc*h avra*l uaet)t r{N a me,| ^~~~~~~~~~~~~~c o/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.hns:t140 :i21n:t warning: aunused function 'xmlFindTag' [-Wunused-function]t t rV140a | lstuaet)i c{ nc| c ^~~~~~~~~~~~~~l /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.hRes:334u:l21t:_ twarning: unused function 'xmlRemoveNode' [-Wunused-function]x m lF334i | nsdtTaatgi(cs tnrcuccltR enscuclltX_mtl *x mxlmRle,m oconvsetN ocdhea(rs*t rtuacgtN amnec,c lsXtmrluNcotd en*c cnloXdem)l N{ o| d ^~~~~~~~~~~~~e */builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h*: n347o:21d:e )warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration]{ | 347 ^~~~~~~~~~ | s /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.ht:a152:21:t iwarning: cunused function 'xmlFindNextTag' [-Wunused-function] n ccl152R | esstualtti_ct nxcmcllARddeTsruelet(s_ttr uxcmtl FnicncdlNXemxlt*T adgs(ts,t rsutruct ncclXmlNode* parect nccnt, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ lXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, consIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLint char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ kBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* nodIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static e, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode*n cclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKnode, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_vIntt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/search.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ 18 warnings generated when compiling for gfx1030. 18 warnings generated when compiling for gfx942. 18 warnings generated when compiling for gfx1100. 18 warnings generated when compiling for gfx1200. 18 warnings generated when compiling for gfx90a. 18 warnings generated when compiling for gfx1201. 18 warnings generated when compiling for gfx908. 18 warnings generated when compiling for gfx1101. 18 warnings generated when compiling for gfx1102. 18 warnings generated when compiling for gfx906. 38 warnings generated when compiling for host. [ 49%] Building CXX object CMakeFiles/rccl.dir/hipify/src/graph/topo.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/topo.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/topo.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/topo.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc 18 warnings generated when compiling for host. [ 50%] Building CXX object CMakeFiles/rccl.dir/hipify/src/graph/trees.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/trees.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/trees.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/trees.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/trees.cc In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:11: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:19: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:11: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:19: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:11: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:19: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:11: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:19: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:11: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:19: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrVIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) {alue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNo | ^~~~~d In file included from e/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:11: ,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] s237 | sttatic ncclResult_ruct ncclXmlNode* searchNode, struct ncclt XncclTmopoDelvToRanNk(struoct ncdclTopeoSyst*em* s*ystem , node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | statint dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(sic ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_ttr uct nxcclTompoSlystem*S sysetem, tint64A_t id,t int*t netDrev) {I | ^~~~~~~~~~~~~~~~~~ f/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14U: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] n272 | stsatic efloatt nccl(TopoNVsLinkBtw(int ruct ncclXmlNode* nodcudaCompCap) { | ^~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetNae, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* amet(strutct nccrlCommN* acomm)m { reeturn c,omm-> ncclCcollNeto->namne; } s| ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.ht:19:21 : warning: unused function 'collNetListen' [-Wunused-function] f 19 | sltaticoat value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254 ncclResult_t collNetListen(struct ncclComm* comm, int dev, vo:21: iwarning: unused function 'xmlSetAttrLong' [-Wunused-function] d 254* | shtataic nnccdlRelsulet_t xm,lS void** letAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(sisttenrComum) c{ NtCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm nc*clX mlNcodeo* nmodem, c,ons t char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const vcoidh* haandrle*s[] , isnt nuranbks,N iantm reank,, vo ids* ltisternCoumm, cvoitd* * cnollcComcm) {l NCXCLCmHEClK(Ncomom->dnccelCo*llN*et-> consnecut(hbandles, nranks, rank, listenComm, collComm)); return ncclSu, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(stccerss;u } c | ^~~~~~~~~~~~~~t /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h :21:n21: cwarning: unused function 'collNetReduceSupport' [-Wunused-function] c l21 | sXtatmic lnccNlReosuldt_et c*oll NetnReduoceSduppeort)(st ruc{t n cc | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTreelComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclC(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict*ol lNedt->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* daitct)a {, | ^~~~~~~~~~~~~~ size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:11: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:19: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode*ev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static n}c | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle));clResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:11: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t colNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:19: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, constwarning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmllSlNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { etAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, coNnCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: st char* attrunused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* cName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | sollComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comtatic ncclResult_t xmlSetAttrLon gchar* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ (struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: m->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclColunused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclRleNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:19: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: sult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclwarning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struXml* dst, struct ncclXmlNct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* nodode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: eunused function 'kvConvertToStr' [-Wunused-function], const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAtt 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ r(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:11: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:19: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:11: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->lIn file included from i/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:11: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, nccsten(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, lRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:19: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.hnranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* suppo:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ rted) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIfl30ush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->nccl warnings generated when compiling for gfx1030. CollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.cc:19: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 30 warnings generated when compiling for gfx1200. 30 warnings generated when compiling for gfx942. 30 warnings generated when compiling for gfx906. 30 warnings generated when compiling for gfx1201. 30 warnings generated when compiling for gfx1102. 30 warnings generated when compiling for gfx1100. 30 warnings generated when compiling for gfx908. 30 warnings generated when compiling for gfx90a. 30 warnings generated when compiling for gfx1101. [ 50%] Building CXX object CMakeFiles/rccl.dir/hipify/src/graph/tuning.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/tuning.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/tuning.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/tuning.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc 30 warnings generated when compiling for host. [ 50%] Building CXX object CMakeFiles/rccl.dir/hipify/src/graph/xml.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/xml.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/xml.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/xml.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.cc In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:107:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 107 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:107:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 107 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:139:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 139 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:139:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 139 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:171:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 171 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:171:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 171 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:203:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 203 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:203:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 203 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:235:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 235 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:235:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 235 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:107:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 107 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:107:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 107 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:139:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 139 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:139:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 139 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:267:3: warning: nested designators are a C99 extension [-Wc99-designator] 267 | .llProtoRanges[RCCL_RS_TUNABLE] = /*ReduceScatter*/ {/* LL (Min/Max) */ {0, 655360, 1} , /* LL128 (Min/Max) */ {131072, 3211264, 1}}, | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:267:17: warning: array designators are a C99 extension [-Wc99-designator] 267 | .llProtoRanges[RCCL_RS_TUNABLE] = /*ReduceScatter*/ {/* LL (Min/Max) */ {0, 655360, 1} , /* LL128 (Min/Max) */ {131072, 3211264, 1}}, | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:171:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 171 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:171:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 171 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:203:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 203 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:203:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 203 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:235:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 235 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:235:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 235 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:267:3: warning: nested designators are a C99 extension [-Wc99-designator] 267 | .llProtoRanges[RCCL_RS_TUNABLE] = /*ReduceScatter*/ {/* LL (Min/Max) */ {0, 655360, 1} , /* LL128 (Min/Max) */ {131072, 3211264, 1}}, | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:267:17: warning: array designators are a C99 extension [-Wc99-designator] 267 | .llProtoRanges[RCCL_RS_TUNABLE] = /*ReduceScatter*/ {/* LL (Min/Max) */ {0, 655360, 1} , /* LL128 (Min/Max) */ {131072, 3211264, 1}}, | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:354:10: warning: unused variable 'llMaxBw' [-Wunused-variable] 354 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:355:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 355 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:356:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 356 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:357:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 357 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:360:9: warning: unused variable 'ppn' [-Wunused-variable] 360 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:354:10: warning: unused variable 'llMaxBw' [-Wunused-variable] 354 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:355:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 355 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:356:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 356 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:357:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 357 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:360:9: warning: unused variable 'ppn' [-Wunused-variable] 360 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:12: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:648:14: warning: unused variable 'treeCorrectionFactor' [-Wunused-variable] 648 | static float treeCorrectionFactor[NCCL_NUM_PROTOCOLS][23] = { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:107:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 107 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:107:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 107 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:107:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 107 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:107:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 107 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint3/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:139:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 139 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:139:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 139 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ 2_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:139:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 139 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:139:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 139 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:171:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 171 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:171:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 171 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:171:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 171 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:171:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 171 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:203:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 203 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:12: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:648:14: warning: unused variable 'treeCorrectionFactor' [-Wunused-variable] 648 | static float treeCorrectionIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:203:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 203 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ , mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:203:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 203 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:203:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 203 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:235:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 235 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:235:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 235 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ Factor[NCCL_NUM_PROTOCOLS][23] = { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:235:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 235 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:235:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 235 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:267:3: warning: nested designators are a C99 extension [-Wc99-designator] 267 | .llProtoRanges[RCCL_RS_TUNABLE] = /*ReduceScatter*/ {/* LL (Min/Max) */ {0, 655360, 1} , /* LL128 (Min/Max) */ {131072, 3211264, 1}}, | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:267:17: warning: array designators are a C99 extension [-Wc99-designator] 267 | .llProtoRanges[RCCL_RS_TUNABLE] = /*ReduceScatter*/ {/* LL (Min/Max) */ {0, 655360, 1} , /* LL128 (Min/Max) */ {131072, 3211264, 1}}, | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:267:3: warning: nested designators are a C99 extension [-Wc99-designator] 267 | .llProtoRanges[RCCL_RS_TUNABLE] = /*ReduceScatter*/ {/* LL (Min/Max) */ {0, 655360, 1} , /* LL128 (Min/Max) */ {131072, 3211264, 1}}, | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:267:17: warning: array designators are a C99 extension [-Wc99-designator] 267 | .llProtoRanges[RCCL_RS_TUNABLE] = /*ReduceScatter*/ {/* LL (Min/Max) */ {0, 655360, 1} , /* LL128 (Min/Max) */ {131072, 3211264, 1}}, | ^~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:354:10: warning: unused variable 'llMaxBw' [-Wunused-variable] 354 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:355:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 355 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:356:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 356 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:357:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 357 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:360:9: warning: unused variable 'ppn' [-Wunused-variable] 360 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:354:10: warning: unused variable 'llMaxBw' [-Wunused-variable] 354 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:355:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 355 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:356:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 356 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:357:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 357 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:360:9: warning: unused variable 'ppn' [-Wunused-variable] 360 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:107:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 107 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:107:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 107 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:139:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 139 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:139:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 139 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:171:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 171 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:171:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 171 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:203:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 203 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:203:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 203 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:235:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 235 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:235:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 235 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:267:3: warning: nested designators are a C99 extension [-Wc99-designator] 267 | .llProtoRanges[RCCL_RS_TUNABLE] = /*ReduceScatter*/ {/* LL (Min/Max) */ {0, 655360, 1} , /* LL128 (Min/Max) */ {131072, 3211264, 1}}, | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:267:17: warning: array designators are a C99 extension [-Wc99-designator] 267 | .llProtoRanges[RCCL_RS_TUNABLE] = /*ReduceScatter*/ {/* LL (Min/Max) */ {0, 655360, 1} , /* LL128 (Min/Max) */ {131072, 3211264, 1}}, | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:107:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 107 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:107:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 107 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINE:354:10D: warning: unused variable 'llMaxBw' [-Wunused-variable] 354 | doubl0e llMaxBw = llMaxBws [index1]| [index2]; ^ | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc: 355:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc355 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:356:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 356 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:357:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 357 | double perChMaxTreeLL128Bw = perChMaxTree:139:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 139 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:139:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 139 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ LL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:360:9: warning: unused variable 'ppn' [-Wunused-variable] 360 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:171:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 171 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:171:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 171 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:203:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 203 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:203:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 203 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:235:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 235 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:235:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 235 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:267:3: warning: nested designators are a C99 extension [-Wc99-designator] 267 | .llProtoRanges[RCCL_RS_TUNABLE] = /In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:12: *ReduceScatter*/ {/* LL (Min/Max) */ {0, 655360, 1} , /* LL128 (Min/Max) */ {131072, 3211264, 1}}, | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:267:17: warning: array designators are a C99 extension [-Wc99-designator] 267 | .llProtoRanges[RCCL_RS_TUNABLE] = /*ReduceScatter*/ {/* LL (Min/Max) */ {0, 655360, 1} , /* LL128 (Min/Max) */ {131072, 3211264, 1}}, | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:648:14: warning: unused variable 'treeCorrectionFactor' [-Wunused-variable] 648 | static float treeCorrectionFactor[NCCL_NUM_PROTOCOLS][23] = { | ^~~~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:12: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:107:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 107 | .llPcudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:648:14: warning: unused variable 'treeCorrectionFactor' [-Wunused-variable] 648 | static float treeCorrectionFactor[NCCL_NUM_PROTOCOLS][23] = { | ^~~~~~~~~~~~~~~~~~~~ rotoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:107:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 107 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:107:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 107 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINE ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:107:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 107 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LID}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:107:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 107 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ MITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:107:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 107 | .llProtoR:139:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] a 139 | n .llPrgotoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:139:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 139 | .llProtoRanges = {RCCL_LL_LIMITes = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ S_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #de/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:139:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 139 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_Lfine RCCL_LL_LIMITS_UNDEFINED 0 | ^ IMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:139:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 139 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ :107:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 107 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_U/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:354:10: warning: unused variable 'llMaxBw' [-Wunused-variable] NDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:107:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 107 | .llProtoRa354 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:355:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 355 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:356:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 356 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:357:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 357 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:360:9: warning: unused variable 'ppn' [-Wunused-variable] 360 | floatnges = {RCCL_LL_LIMITS_UNDEF ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:139:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 139 | ./builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.ccllProtoRanges:171:21 : warning: suggest braces around initialization of subobject [-Wmissing-braces] =171 | I .NED},{l | ^~~~~~~~~~~~~~~~~~~~~~~~ Rl | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.hCP:CL_LL_LIMITS_UNDEFrotoRIanges N= {RCCEL_LL35:D_34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED'L} 35 | #,Idefin Me RCCIL_LL_LT IMITS_SUNDEFI_NED 0 U | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:171:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 171 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.ccNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIM| ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:139:21: warning: RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:171:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 171 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ suggest braces around initialization of subobject [-Wmissing-braces] 139 | .llProtoRanges = {RCCL_LL_LIITMS_UNIDEFITNED S0 _ | ^ U/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.ccN:D171:21:E warning: suggest braces around initialization of subobject [-Wmissing-braces] F 171 | I N.llPErotoRDan}ges ,= {R CCL_ LL| ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ :139:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 139 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:139:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 139 | .llProtoRanges = {RCCL_LL_ L | ^ I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.ccMITS_UND/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:203:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 203 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:203:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 203 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.ccEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 :203:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 203 | .llProtoRan| ^ g/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cces = {RCCL_LL_LIMITS_UNDEFINED}, :171:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 171 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:171:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 171 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEF | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:203:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 203 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:INED34}, :| ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.hnote: :35:expanded from macro 'RCCL_LL_LIMITS_UNDEFINED'34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #defi35ne R | CC#L_LL_dLIMeITS_UfNDEFiINEDn 0 e:| 171: ^21:R warning: suggest braces around initialization of subobject [-Wmissing-braces] CCL_LL_LIMITS_UN 171 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #de/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:235:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 235 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_Lfine RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.ccDEFINED 0IMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:235:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 235 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:171:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 171 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:267:3: warning: nested designators are a C99 extension [-Wc99-designator] 267 | .llProtoRanges[RCCL_RS_TUNABLE] = /*ReduceScatter*/ {/* LL (Min/Max) */ {0, 655360, 1} , /* LL128 (Min/Max) */ {131072, 3211264, 1}}, | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:267:17: warning: array designators are a C99 extension [-Wc99-designator] 267 | .llProtoRanges[RCCL_RS_TUNABLE] = /*ReduceScatter*/ {/* LL (Min/Max) */ {0, 655360, 1} , /* LL128 (Min/Max) */ {131072, 3211264, 1}}, | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:203:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 203 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35::235:2134: warning: suggest braces around initialization of subobject [-Wmissing-braces]: 235 | .llProtoRanote: ngesexpanded from macro 'RCCL_LL_LIMITS_UNDEFINED' = { RCCL _LL_LIM35ITS | _U#NDEFdIefine RNECD},C | ^~~~~~~~~~~~~~~~~~~~~~~~ L_LL_LIMITS_UND | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.hE:35:F34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED'I 35N | ED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:203:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 203 | .llP#define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:235:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 235 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINErotoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIM/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.ccITS_UNDEFINED: 203:21:0 warning: suggest braces around initialization of subobject [-Wmissing-braces] 203 | .ll| Prot ^oRan ges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFDI}, N| ^~~~~~~~~~~~~~~~~~~~~~~~ E| { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.hD:35:34 : note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED'0 35 | # defi| ne R ^CCL_ LL_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.ccLIMITS_UNDEFINED 0 | ^: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc203:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 203 | :267:3: warning: nested designators are a C99 extension [-Wc99-designator] 267 | .llP .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:235:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 235 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:235:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 235 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ rotoRanges[RCCL_RS_TUNABLE] = /*ReduceScatter*/ {/* LL (Min/Max) */ {0, 655360, 1} , /* LL128 (Min/Max) */ {131072, 3211264, 1}}, | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:267:17: warning: array designators are a C99 extension [-Wc99-designator] 267 | .llProtoRanges[RCCL_RS_TUNABLE] = /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:235:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 235 | .llP/*RreduoceStcatoterR*/ {/* LL a(Minn/Mgax)e *s/ { 0, =655 360, 1{} ,R /C* LCL12L8 (_MinL/MaLx) _*/ L{13I107M2, I321T126S4, _1}}/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:267:3: warning: nested designators are a C99 extension [-Wc99-designator] 267 | .llProtoRanges[RCCL_RS_TUNABLE] = /*ReduceScatter*/ {/* LL (Min/Max) */ {0, 655360, 1} , /* LL128 (Min/Max) */ {131072, 3211264, 1}}, | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:267:17: warning: array designators are a C99 extension [-Wc99-designator] 267 | .llPU, N| ^~~~~~~~~~~~~~~~~ DEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ rotoRanges[RCCL_RS_TUNABLE] = /*ReduceScatter*/ {/* LL (Min/Max) */ {0, 655360, 1} , /* LL128 (Min/Max) */ {131072, 3211264, 1}}, | ^~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:235:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 235 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:267:3: warning: nested designators are a C99 extension [-Wc99-designator] 267 | .llProtoRanges[RCCL_RS_TUNABLE] = /*ReduceScatter*/ {/* LL (Min/Max) */ {0, 655360, 1} , /* LL128 (Min/Max) */ {131072, 3211264, 1}}, | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:267:17: warning: array designators are a C99 extension [-Wc99-designator] 267 | .llProtoRanges[RCCL_RS_TUNABLE] = /*ReduceScatter*/ {/* LL (Min/Max) */ {0, 655360, 1} , /* LL128 (Min/Max) */ {131072, 3211264, 1}}, | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:354:10: warning: unused variable 'llMaxBw' [-Wunused-variable] 354 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:355:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 355 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:356:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 356 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:357:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 357 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:360:9: warning: unused variable 'ppn' [-Wunused-variable] 360 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving a/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cct the same GPU through the NIC, apply some bw discount | ^~~ :354:10: warning: unused variable 'llMaxBw' [-Wunused-variable] 354 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:355:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 355 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:356:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 356 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:357:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 357 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:360:9: warning: unused variable 'ppn' [-Wunused-variable] 360 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:354:10: warning: unused variable 'llMaxBw' [-Wunused-variable] 354 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:355:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 355 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:356:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 356 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:357:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 357 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCap/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:107:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] Ind 107 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:107:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 107 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ ex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:360:9: warning: unused variable 'ppn' [-Wunused-variable] 360 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:139:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 139 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:354:10: warning: unused variable 'llMaxBw' [-Wunused-variable] 354 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:355:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 355 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:356:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 356 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:357:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 357 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:360:9: warning: unused variable 'ppn' [-Wunused-variable] 360 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:12: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:139:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 139 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:171:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 171 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:171:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 171 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:203:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 203 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINunused function 'isPow2' [-Wunused-function] 283 | sED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:203:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 203 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ tatic bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:648:14: warning: unused variable 'treeCorrectionFactor' [-Wunused-variable] 648 | static float treeCorrectionFactor[NCCL_NUM_PROTOCOLS][23] = { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:235:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 235 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:235:21: warning: suggest braces around initialization of subobject [-Wmissing-braces] 235 | .llProtoRanges = {RCCL_LL_LIMITS_UNDEFINED}, | ^~~~~~~~~~~~~~~~~~~~~~~~ | { } /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_common.h:35:34: note: expanded from macro 'RCCL_LL_LIMITS_UNDEFINED' 35 | #define RCCL_LL_LIMITS_UNDEFINED 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:267:3: warning: nested designators are a C99 extension [-Wc99-designator] 267 | .llProtoRanges[RCCL_RS_TUNABLE] = /*ReduceScatter*/ {/* LL (Min/Max) */ {0, 655360, 1} , /* LL128 (Min/Max) */ {131072, 3211264, 1}}, | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:267:17: warning: array designators are a C99 extension [-Wc99-designator] 267 | .llProtoRanges[RCCL_RS_TUNABLE] = /*ReduceScatter*/ {/* LL (Min/Max) */ {0, 655360, 1} , /* LL128 (Min/Max) */ {131072, 3211264, 1}}, | ^~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:12: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:648:14: warning: unused variable 'treeCorrectionFactor' [-Wunused-variable] 648 | static float treeCorrectionFactor[NCCL_NUM_PROTOCOLS][23] = { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:354:10: warning: unused variable 'llMaxBw' [-Wunused-variable] 354 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:355:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 355 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:356:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 356 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:357:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 357 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:360:9: warning: unused variable 'ppn' [-Wunused-variable] 360 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:12: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:12: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTop:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopooSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSysStysteem* sysmtem,* int64 _t ids, int* nyetDev)s { tem, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~| ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h :262:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.hwarning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | stat:ic flo237at nc:21clTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cud: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* aCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:648:14: warning: unused variable 'treeCorrectionFactor' [-Wunused-variable] 648In file included from | sta/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:t12: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21i: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] c215 | stat ic ncclfResultl_t nccolTsysoatem, ptint64 o_t idI,t intd*r netTDeev) o{e | ^~~~~~~~~~~~~~~~~~ IC/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14on: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] rd 262 | erstatixec flo(cat ncsctlTopotXiGonFacructt ncMISopeecd(r[NCCLlTopoSystem* system, int cotnst chyar* gcpn) { e| ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:,272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function]int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 272 | s tatic float ncclTo226poNVL | inkBw(sint cudtaComatic nccpCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h_NUM_PROTOCOLS][23] = { | ^~~~~~~~~~~~~~~~~~~~ lResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t n:c283:13:c warning: unused function 'isPow2' [-Wunused-function] l 283 | sTtatico bopol iosPow2D(inte valv) { T | ^~~~~~ o/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:R12: warning: aunused function 'mirrorBits' [-Wunused-function] n286 | stkatic (int smirrtorBirts(iunt vacl, itnt p ow2)n { c| ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.ccc:648l:14: Twarning: unused variable 'treeCorrectionFactor' [-Wunused-variable] o648 | stpatico floSat ytreseCtorreectiomnF*acto r[NCCsLystem, int dev, int*_NUM_PROTOCOLS][23] = { rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t | n ^~~~~~~~~~~~~~~~~~~~ cclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:648:14: warning: unused variable 'treeCorrectionFactor' [-Wunused-variable] 648 | static float treeCorrectionFactor[NCCL_NUM_PROTOCOLS][23] = { | ^~~~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:12: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:648:14: warning: unused variable 'treeCorrectionFactor' [-Wunused-variable] 648 | static float treeCorrectionFactor[NCCL_NUM_PROTOCOLS][23] = { | ^~~~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:12: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/tuning.cc:648:14: warning: unused variable 'treeCorrectionFactor' [-Wunused-variable] 648 | static float treeCorrectionFactor[NCCL_NUM_PROTOCOLS][23] = { | ^~~~~~~~~~~~~~~~~~~~ 27 warnings generated when compiling for gfx942. 27 warnings generated when compiling for gfx90a. 27 warnings generated when compiling for gfx906. 27 warnings generated when compiling for gfx1030. 27 warnings generated when compiling for gfx1101. 27 warnings generated when compiling for gfx1200. 27 warnings generated when compiling for gfx1201. 27 warnings generated when compiling for gfx908. 27 warnings generated when compiling for gfx1100. 27 warnings generated when compiling for gfx1102. 27 warnings generated when compiling for host. [ 50%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/alt_rsmi.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/alt_rsmi.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/alt_rsmi.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/alt_rsmi.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.cc:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.cc:17: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.cc:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.cc:17: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.cc:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.cc:17: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.cc:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.cc:17: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.cc:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.cc:17: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.cc:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.cc:17: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.cc:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.cc:17: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.cc:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.cc:17: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const chamlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ r* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.cc:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.cc:17: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(10s warnings generated when compiling for gfx90a. truct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.cc:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.cc:17: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.cc:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.cc:17: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx942. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for host. [ 50%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/archinfo.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/archinfo.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/archinfo.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/archinfo.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/archinfo.cc /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:105:33: warning: bitwise negation of a boolean expression always evaluates to 'true'; did you mean logical negation? [-Wbool-operation] 105 | if (ret_gpu_id == 0 && ~(ret_unique_id != 0 || ret_loc_id != 0 || ret_unique_id != 0 || ret_vendor != 0) && | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | ! /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:103:13: warning: unused variable 'ret_domain' [-Wunused-variable] 103 | int ret_domain = read_node_properties(node_id, "domain", &domain, properties); | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:105:33: warning: bitwise negation of a boolean expression always evaluates to 'true'; did you mean logical negation? [-Wbool-operation] 105 | if (ret_gpu_id == 0 && ~(ret_unique_id != 0 || ret_loc_id != 0 || ret_unique_id != 0 || ret_vendor != 0) && | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | ! /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:103:13: warning: unused variable 'ret_domain' [-Wunused-variable] 103 | int ret_domain = read_node_properties(node_id, "domain", &domain, properties); | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:105:33: warning: bitwise negation of a boolean expression always evaluates to 'true'; did you mean logical negation? [-Wbool-operation] 105 | if (ret_gpu_id == 0 && ~(ret_unique_id != 0 || ret_loc_id != 0 || ret_unique_id != 0 || ret_vendor != 0) && | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | ! /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:103:13: warning: unused variable 'ret_domain' [-Wunused-variable] 103 | int ret_domain = read_node_properties(node_id, "domain", &domain, properties); | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:233:22: warning: unused variable 'hops' [-Wunused-variable] 233 | uint64_t hops; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:70:14: warning: unused variable 'count' [-Wunused-variable] 70 | uint32_t count = 0; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:105:33: warning: bitwise negation of a boolean expression always evaluates to 'true'; did you mean logical negation? [-Wbool-operation] 105 | if (ret_gpu_id == 0 && ~(ret_unique_id != 0 || ret_loc_id != 0 || ret_unique_id != 0 || ret_vendor != 0) && | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | ! /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:103:13: warning: unused variable 'ret_domain' [-Wunused-variable] 103 | int ret_domain = read_node_properties(node_id, "domain", &domain, properties); | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:105:33: warning: bitwise negation of a boolean expression always evaluates to 'true'; did you mean logical negation? [-Wbool-operation] 105 | if (ret_gpu_id == 0 && ~(ret_unique_id != 0 || ret_loc_id != 0 || ret_unique_id != 0 || ret_vendor != 0) && | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | ! /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:105:33: warning: bitwise negation of a boolean expression always evaluates to 'true'; did you mean logical negation? [-Wbool-operation] 105 | if (ret_gpu_id == 0 && ~(ret_unique_id != 0 || :103:13: warning: unused variable 'ret_domain' [-Wunused-variable] 103 | iret_loc_id != 0 || ret_unique_id != 0 || ret_vendor != 0) && | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | ! nt ret_domain = read_node_properties(node_id, "domain", &domain, properties); | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:103:13: warning: unused variable 'ret_domain' [-Wunused-variable] 103 | int ret_domain = read_node_properties(node_id, "domain", &domain, properties); | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:105:33: warning: bitwise negation of a boolean expression always evaluates to 'true'; did you mean logical negation? [-Wbool-operation] 105 | if (ret_gpu_id == 0 && ~(ret_unique_id != 0 || ret_loc_id != 0 || ret_unique_id != 0 || ret_vendor != 0) && | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | ! :105:33: warning: bitwise negation of a boolean expression always evaluates to 'true'; did you mean logical negation? [-Wbool-operation] 105 | if (ret_gpu_id == 0 && ~(ret_unique_id != 0 || ret_loc_id != 0 || re/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cct_unique:105:_33: warning: bitwise negation of a boolean expression always evaluates to 'true'; did you mean logical negation? [-Wbool-operation] id != 0 105 | | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc| ret_vendor != 0) && | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | ! if (ret_gpu_id == 0 && ~(ret_unique_id != 0 || ret_loc_id != 0 || ret_unique_id != 0 || ret_:103:13: warning: unused variable 'ret_domain' [-Wunused-variable] 103 | int ret_domain = read_node_properties(node_id, "domain", &domain, propertievendor != 0) && | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | ! /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.ccs); | ^~~~~~~~~~ :103:13: warning: unused variable 'ret_domain' [-Wunused-variable] 103/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc | : 103:13: warning: unused variable 'ret_domain' [-Wunused-variable] 103 | int r /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cce:233:22: warning: unused variable 'hops' [-Wunused-variable] 233 | uint64_t hops; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:70:14: warning: unused variable 'count' [-Wunused-variable] 70 | uint32_t count = 0; | ^~~~~ t_doma in = reiad_noden_propertties(node_id, "dom ain", &dromain, eprotperties); | ^~~~~~~~~~ _domain = read_node_properties(node_id, "domain", &domain, properties); | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:233:22: warning: unused variable 'hops' [-Wunused-variable] 233 | uint64_t hops; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:70:14: warning: unused variable 'count' [-Wunused-variable] 70 | uint32_t count = 0; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:233:22: warning: unused variable 'hops' [-Wunused-variable] 233 | uint64_t hops; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:70:14: warning: unused variable 'count' [-Wunused-variable] 70 | uint32_t count = 0; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:233:22: warning: unused variable 'hops' [-Wunused-variable] 233 | uint64_t hops; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:70:14: warning: unused variable 'count' [-Wunused-variable] 70 | uint32_t count = 0; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:233:22: warning: unused variable 'hops' [-Wunused-variable] 233 | uint64_t hops; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:70:14: warning: unused variable 'count' [-Wunused-variable] 70 | uint32_t count = 0; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:233:22: warning: unused variable 'hops' [-Wunused-variable] 233 | uint64_t hops; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:70:14: warning: unused variable 'count' [-Wunused-variable] 70 | uint32_t count = 0; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:233:22: warning: unused variable 'hops' [-Wunused-variable] 233 | uint64_t hops; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:70:14: warning: unused variable 'count' [-Wunused-variable] 70 | uint32_t count = 0; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:233:22: warning: unused variable 'hops' [-Wunused-variable] 233 | uint64_t hops; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:70:14: warning: unused variable 'count' [-Wunused-variable] 70 | uint32_t count = 0; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:105:33: warning: bitwise negation of a boolean expression always evaluates to 'true'; did you mean logical negation? [-Wbool-operation] 105 | if (ret_gpu_id == 0 && ~(ret_unique_id != 0 || ret_loc_id != 0 || ret_unique_id != 0 || ret_vendor != 0) && | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | ! /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:103:13: warning: unused variable 'ret_domain' [-Wunused-variable] 103 | int ret_domain = read_node_properties(node_id, "domain", &domain, properties); | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:105:33: warning: bitwise negation of a boolean expression always evaluates to 'true'; did you mean logical negation? [-Wbool-operation] 105 | if (ret_gpu_id == 0 && ~(ret_unique_id != 0 || ret_loc_id != 0 || ret_unique_id != 0 || ret_vendor != 0) && | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | ! /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:103:13: warning: unused variable 'ret_domain' [-Wunused-variable] 103 | int ret_domain = read_node_properties(node_id, "domain", &domain, properties); | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:233:22: warning: unused variable 'hops' [-Wunused-variable] 233 | uint64_t hops; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:70:14: warning: unused variable 'count' [-Wunused-variable] 70 | uint32_t count = 0; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:233:22: warning: unused variable 'hops' [-Wunused-variable] 233 | uint64_t hops; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:70:14: warning: unused variable 'count' [-Wunused-variable] 70 | uint32_t count = 0; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:52:20: warning: unused variable 'kPathDRMRoot' [-Wunused-variable] 52 | static const char *kPathDRMRoot = "/sys/class/drm"; | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:559:13: warning: unused function 'fileExists' [-Wunused-function] 559 | static bool fileExists(char const *filename) | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:52:20: warning: unused variable 'kPathDRMRoot' [-Wunused-variable] 52 | static const char *kPathDRMRoot = "/sys/class/drm"; | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:559:13: warning: unused function 'fileExists' [-Wunused-function] 559 | static bool fileExists(char const *filename) | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:52:20: warning: unused variable 'kPathDRMRoot' [-Wunused-variable] 52 | static const char *kPathDRMRoot = "/sys/class/drm"; | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:559:13: warning: unused function 'fileExists' [-Wunused-function] 559 | static bool fileExists(char const *filename) | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:52:20: warning: unused variable 'kPathDRMRoot' [-Wunused-variable] 52 | static const char *kPathDRMRoot = "/sys/class/drm"; | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:559:13: warning: unused function 'fileExists' [-Wunused-function] 559 | static bool fileExists(char const *filename) | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:52:20: warning: unused variable 'kPathDRMRoot' [-Wunused-variable] 52 | static const char *kPathDRMRoot = "/sys/class/drm"; | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:559:13: warning: unused function 'fileExists' [-Wunused-function] 559 | static bool fileExists(char const *filename) | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:52:20: warning: unused variable 'kPathDRMRoot' [-Wunused-variable] 52 | static const char *kPathDRMRoot = "/sys/class/drm"; | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:559:13: warning: unused function 'fileExists' [-Wunused-function] 559 | static bool fileExists(char const *filename) | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:52:20: warning: unused variable 'kPathDRMRoot' [-Wunused-variable] 52 | static const char *kPathDRMRoot = "/sys/class/drm"; | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:559:13: warning: unused function 'fileExists' [-Wunused-function] 559 | static bool fileExists(char const *filename) | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:52:20: warning: unused variable 'kPathDRMRoot' [-Wunused-variable] 52 | static const char *kPathDRMRoot = "/sys/class/drm"; | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:559:13: warning: unused function 'fileExists' [-Wunused-function] 559 | static bool fileExists(char const *filename) | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:52:20: warning: unused variable 'kPathDRMRoot' [-Wunused-variable] 52 | static const char *kPathDRMRoot = "/sys/class/drm"; | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:559:13: warning: unused function 'fileExists' [-Wunused-function] 559 | static bool fileExists(char const *filename) | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:52:20: warning: unused variable 'kPathDRMRoot' [-Wunused-variable] 52 | static const char *kPathDRMRoot = "/sys/class/drm"; | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:559:13: warning: unused function 'fileExists' [-Wunused-function] 559 | static bool fileExists(char const *filename) | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:52:20: warning: unused variable 'kPathDRMRoot' [-Wunused-variable] 52 | static const char *kPathDRMRoot = "/sys/class/drm"; | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:559:13: warning: unused function 'fileExists' [-Wunused-function] 559 | static bool fileExists(char const *filename) | ^~~~~~~~~~ 6 warnings generated when compiling for gfx1200. 6 warnings generated when compiling for gfx906. 6 warnings generated when compiling for gfx1101. 6 warnings generated when compiling for gfx1030. 6 warnings generated when compiling for gfx90a. 6 warnings generated when compiling for gfx942. 6 warnings generated when compiling for gfx908. 6 warnings generated when compiling for gfx1201. 6 warnings generated when compiling for gfx1102. 6 warnings generated when compiling for gfx1100. [ 51%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/argcheck.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/argcheck.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/argcheck.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/argcheck.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/argcheck.cc In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 6 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ [ 51%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/api_trace.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/api_trace.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/api_trace.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/api_trace.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/api_trace.cc In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx1200. 2 warnings generated when compiling for gfx1030. 2 warnings generated when compiling for gfx906. 2 warnings generated when compiling for gfx1100. 2 warnings generated when compiling for gfx1102. 2 warnings generated when compiling for gfx942. 2 warnings generated when compiling for gfx1201. 2 warnings generated when compiling for gfx908. 2 warnings generated when compiling for gfx90a. 2 warnings generated when compiling for gfx1101. [ 51%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/ibvsymbols.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/ibvsymbols.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/ibvsymbols.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/ibvsymbols.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ibvsymbols.cc In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/api_trace.cc:3: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/api_trace.cc:3: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/api_trace.cc:3: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/api_trace.cc:3: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/api_trace.cc:3: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/api_trace.cc:3: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/api_trace.cc:3: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/api_trace.cc:3: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/api_trace.cc:3: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/api_trace.cc:3: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/api_trace.cc:3: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx908. 1 warning generated when compiling for gfx1102. 1 warning generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ibvsymbols.cc:67: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ibvsymbols.cc:67: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ibvsymbols.cc:67: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ibvsymbols.cc:67: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ibvsymbols.cc:67: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ibvsymbols.cc:67: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ibvsymbols.cc:67: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from 1 warning generated when compiling for gfx90a. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ibvsymbols.cc:67: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for host. 1 warning generated when compiling for gfx1100. 11 warning generated when compiling for gfx1200. warning generated when compiling for gfx1030. 1 warning generated when compiling for gfx906. 1 warning generated when compiling for gfx1101. 1 warning generated when compiling for gfx1201. 1 warning generated when compiling for gfx1030. 11 warning generated when compiling for gfx1200. warning generated when compiling for gfx1100. 1 warning generated when compiling for gfx942. [ 51%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/ibvwrap.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/ibvwrap.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/ibvwrap.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/ibvwrap.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ibvwrap.cc In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ibvsymbols.cc:67: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ibvsymbols.cc:67: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ibvsymbols.cc:67: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx1102. 1 warning generated when compiling for gfx1101. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx906. 1 warning generated when compiling for gfx1201. 1 warning generated when compiling for gfx908. [ 52%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/ipcsocket.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/ipcsocket.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/ipcsocket.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/ipcsocket.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ipcsocket.cc In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ibvwrap.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/ibvwrap.h:21: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ibvwrap.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/ibvwrap.h:21: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ibvwrap.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/ibvwrap.h:21: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ibvwrap.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/ibvwrap.h:21: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ibvwrap.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/ibvwrap.h:21: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ibvwrap.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/ibvwrap.h:21: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ibvwrap.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/ibvwrap.h:21: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ibvwrap.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/ibvwrap.h:21: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ibvwrap.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/ibvwrap.h:21: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ibvwrap.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/ibvwrap.h:21: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ibvwrap.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/ibvwrap.h:21: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx908. 1 warning generated when compiling for gfx1101. 1 warning generated when compiling for gfx1201. 1 warning generated when compiling for gfx1102. 1 warning generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ipcsocket.cc:8: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx942. 1 warning generated when compiling for gfx1030. 1 warning generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ipcsocket.cc:8: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ipcsocket.cc:8: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ipcsocket.cc:8: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ipcsocket.cc:8: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ipcsocket.cc:8: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 1In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ipcsocket.cc:8: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h: warning generated when compiling for gfx110044. :13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ipcsocket.cc:8: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ipcsocket.cc:8: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ipcsocket.cc:8: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ [ 52%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/npkit.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/npkit.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/npkit.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/npkit.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/npkit.cc In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/ipcsocket.cc:8: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for host. 1 warning generated when compiling for gfx1201. 1 warning generated1 warning generated when compiling for gfx1102. when compiling for gfx1200. 1 warning generated when compiling for gfx942. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx908. 1 warning generated when compiling for gfx1100. 1 warning generated when compiling for gfx1030. 1 warning generated when compiling for gfx1101. 1 warning generated when compiling for gfx906. [ 52%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/nvmlwrap_stub.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/nvmlwrap_stub.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/nvmlwrap_stub.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/nvmlwrap_stub.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/nvmlwrap_stub.cc In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/npkit.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/npkit/npkit.h:16: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/npkit.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/npkit/npkit.h:16: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/npkit.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/npkit/npkit.h:16: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/npkit.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/npkit/npkit.h:16: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/npkit.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/npkit/npkit.h:16: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/npkit.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/npkit/npkit.h:16: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/npkit.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/npkit/npkit.h:16: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/npkit.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/npkit/npkit.h:16: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/npkit.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/npkit/npkit.h:16: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/npkit.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/npkit/npkit.h:16: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/npkit.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/npkit/npkit.h:16: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/npkit.cc:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/npkit.cc:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/npkit.cc:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/npkit.cc:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/npkit.cc:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/npkit.cc:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ [ 52%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/param.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/param.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/param.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/param.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/param.cc In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/npkit.cc:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/npkit.cc:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/npkit.cc:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/npkit.cc:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/npkit.cc:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx942. 2 warnings generated when compiling for gfx1201. 2 warnings generated when compiling for gfx908. 2 warnings generated when compiling for gfx1200. 2 warnings generated when compiling for gfx906. 2 warnings generated when compiling for gfx1102. 2 warnings generated when compiling for gfx1100. 2 warnings generated when compiling for gfx1101. 2 warnings generated when compiling for gfx1030. 2 warnings generated when compiling for gfx90a. 2 warnings generated when compiling for host. [ 53%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/profiler.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/profiler.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/profiler.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/profiler.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/profiler.cc [ 53%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/rocm_smi_wrap.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/rocm_smi_wrap.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/rocm_smi_wrap.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/rocm_smi_wrap.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/rocm_smi_wrap.cc In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/proxy.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/proxy.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/proxy.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/proxy.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/proxy.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/proxy.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/proxy.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/proxy.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/proxy.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/proxy.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/proxy.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/proxy.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/proxy.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/proxy.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/proxy.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/proxy.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/proxy.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/proxy.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/profiler.cc:7In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/proxy.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/proxy.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/proxy.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/proxy.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/info.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx1030. 2 warnings generated when compiling for gfx1101. 2 warnings generated when compiling for gfx906. 2 warnings generated when compiling for gfx942. 2 warnings generated when compiling for gfx1201. 2 warnings generated when compiling for gfx90a. 2 warnings generated when compiling for gfx1200. 2 warnings generated when compiling for gfx908. 2 warnings generated when compiling for gfx1100. 2 warnings generated when compiling for gfx1102. [ 53%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/rocmwrap.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/rocmwrap.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/rocmwrap.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/rocmwrap.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/rocmwrap.cc In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/rocm_smi_wrap.cc:24: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/rocm_smi_wrap.cc:24: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/rocm_smi_wrap.cc:24: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/rocm_smi_wrap.cc:24: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/rocm_smi_wrap.cc:24: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/rocm_smi_wrap.cc:24: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/rocm_smi_wrap.cc:24: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/rocm_smi_wrap.cc:24: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/rocm_smi_wrap.cc:24: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/rocm_smi_wrap.cc:24: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/rocm_smi_wrap.cc:24: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for host. 1 warning generated when compiling for gfx1102. 1 warning generated when compiling for gfx1030. 1 warning generated when compiling for gfx906. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx1200. 11 warning generated when compiling for gfx942. warning generated when compiling for gfx908. 1 warning generated when compiling for gfx1201. 1 warning generated when compiling for gfx1101. 1 warning generated when compiling for gfx1100. [ 53%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/roctx.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/roctx.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/roctx.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/roctx.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/roctx.cc [ 54%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/shmutils.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/shmutils.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/shmutils.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/shmutils.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/shmutils.cc In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx1100. 1 warning generated when compiling for gfx942. 1 warning generated when compiling for gfx1101. 1 warning generated when compiling for host. 11 warning generated when compiling for gfx908. warning generated when compiling for gfx1102. 1 warning generated when compiling for gfx1030. 1 warning generated when compiling for gfx1200. 1 warning generated when compiling for gfx906. 1 warning generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/shmutils.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/shmutils.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ [ 54%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/signals.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/signals.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/signals.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/signals.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/signals.cc In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/shmutils.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/shmutils.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/shmutils.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/shmutils.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissaIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/shmutils.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ ; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/shmutils.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/shmutils.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/shmutils.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/shmutils.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/shmutils.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/shmutils.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/shmutils.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/shmutils.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/shmutils.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/shmutils.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/shmutils.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/shmutils.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/shmutils.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/shmutils.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/shmutils.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for host. 2 warnings generated when compiling for gfx1102. 2 warnings generated when compiling for gfx906. 2 warnings generated when compiling for gfx908. 2 warnings generated when compiling for gfx1200. 2 warnings generated when compiling for gfx90a. 2 warnings generated when compiling for gfx1030. 2 warnings generated when compiling for gfx942. 2 warnings generated when compiling for gfx1201. 2 warnings generated when compiling for gfx1101. 2 warnings generated when compiling for gfx1100. [ 54%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/socket.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/socket.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/socket.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/socket.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/socket.cc [ 54%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/strongstream.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/strongstream.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/strongstream.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/strongstream.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/strongstream.cc /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/socket.cc:602:8: warning: unused variable 'line' [-Wunused-variable] 602 | char line[SOCKET_NAME_MAXLEN+1]; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/socket.cc:602:8: warning: unused variable 'line' [-Wunused-variable] 602 | char line[SOCKET_NAME_MAXLEN+1]; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/socket.cc:9: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/socket.cc:602:8: warning: unused variable 'line' [-Wunused-variable] 602 | char line[SOCKET_NAME_MAXLEN+1]; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/socket.cc:602:8: warning: unused variable 'line' [-Wunused-variable] 602 | char line[SOCKET_NAME_MAXLEN+1]; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/socket.cc:602:8: warning: unused variable 'line' [-Wunused-variable] 602 | char line[SOCKET_NAME_MAXLEN+1]; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/socket.cc:602:8: warning: unused variable 'line' [-Wunused-variable] 602 | char line[SOCKET_NAME_MAXLEN+1]; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/socket.cc:9: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/socket.cc:602:8: warning: unused variable 'line' [-Wunused-variable] 602 | char line[SOCKET_NAME_MAXLEN+1]; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/socket.cc:9: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/socket.cc:9: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/socket.cc:9: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/socket.cc:9: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/socket.cc:9: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/socket.cc:602:8: warning: unused variable 'line' [-Wunused-variable] 602 | char line[SOCKET_NAME_MAXLEN+1]; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/socket.cc:602:8: warning: unused variable 'line' [-Wunused-variable] 602 | char line[SOCKET_NAME_MAXLEN+1]; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/socket.cc:602:8: warning: unused variable 'line' [-Wunused-variable] 602 | char line[SOCKET_NAME_MAXLEN+1]; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/socket.cc:602:8: warning: unused variable 'line' [-Wunused-variable] 602 | char line[SOCKET_NAME_MAXLEN+1]; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/socket.cc:9: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/socket.cc:9: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/socket.cc:9: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/socket.cc:9: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx90a. 2 warnings generated when compiling for gfx906. 2 warnings generated when compiling for gfx1102. 2 warnings generated when compiling for gfx1200. 2 warnings generated when compiling for gfx1101. 2 warnings generated when compiling for gfx942. 2 warnings generated when compiling for gfx1100. 2 warnings generated when compiling for gfx1030. 2 warnings generated when compiling for gfx908. 2 warnings generated when compiling for gfx1201. 2 warnings generated when compiling for host. [ 55%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/tuner.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/tuner.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/tuner.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/tuner.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/tuner.cc [ 55%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/utils.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/utils.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/utils.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/utils.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/utils.cc In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/tuner.cc:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/tuner.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/tuner.cc:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/tuner.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/tuner.cc:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/tuner.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/tuner.cc:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/tuner.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/tuner.cc:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/tuner.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/tuner.cc:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/tuner.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/tuner.cc:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/tuner.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/tuner.cc:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/tuner.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/tuner.cc:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/tuner.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/tuner.cc:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/tuner.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/tuner.cc:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/tuner.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/tuner.cc:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/tuner.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/tuner.cc:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/tuner.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/tuner.cc:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/tuner.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/tuner.cc:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/tuner.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/tuner.cc:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/tuner.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/tuner.cc:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/tuner.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/tuner.cc:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/tuner.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/tuner.cc:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/tuner.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/tuner.cc:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/tuner.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/tuner.cc:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/tuner.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/tuner.cc:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/tuner.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for host. 2 warnings generated when compiling for gfx1200. 2 warnings generated when compiling for gfx1201. 2 warnings generated when compiling for gfx1030. 2 warnings generated when compiling for gfx942. 2 warnings generated when compiling for gfx1101. 2 warnings generated when compiling for gfx90a. 2 warnings generated when compiling for gfx908. 2 warnings generated when compiling for gfx906. 2 warnings generated when compiling for gfx1100. 2 warnings generated when compiling for gfx1102. [ 55%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_lifecycle.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_lifecycle.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_lifecycle.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_lifecycle.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/utils.cc:7: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/utils.cc:7: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/utils.cc:7: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/utils.cc:7: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/utils.cc:7: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/utils.cc:7: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/utils.cc:7: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/utils.cc:7: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/utils.cc:7: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/utils.cc:7: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/utils.cc:7: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx1201. 1 warning generated when compiling for gfx1102. 1 warning generated when compiling for gfx1100. 1 warning generated when compiling for gfx1200. 1 warning generated when compiling for gfx942. 1 warning generated when compiling for gfx906. 1 warning generated when compiling for gfx1101. 1 warning generated when compiling for gfx908. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx1030. [ 55%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_parser.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_parser.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_parser.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_parser.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:19: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:19: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:19: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:19: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:19: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:19: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:19: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | ead , mantissa; | u ^ int32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:19: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:19: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:19: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | ead, mantissa; | ^ uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:19: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:517:10: warning: unused variable 'nBytes' [-Wunused-variable] 517 | size_t nBytes = count * ncclTypeSize(dataType); | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:517:10: warning: unused variable 'nBytes' [-Wunused-variable] 517 | size_t nBytes = count * ncclTypeSize(dataType); | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:517:10: warning: unused variable 'nBytes' [-Wunused-variable] 517 | size_t nBytes = count * ncclTypeSize(dataType); | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:517:10: warning: unused variable 'nBytes' [-Wunused-variable] 517 | size_t nBytes = count * ncclTypeSize(dataType); | ^~~~~~ :517:10: warning: unused variable 'nBytes' [-Wunused-variable] 517 | size_t nBytes = count * ncclTypeSize(dataType); | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:517:10: warning: unused variable 'nBytes' [-Wunused-variable] 517 | size_t nBytes = count * ncclTypeSize(dataType); | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:517:10: warning: unused variable 'nBytes' [-Wunused-variable] 517 | size_t nBytes = count * ncclTypeSize(dataType); | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:517:10: warning: unused variable 'nBytes' [-Wunused-variable] 517 | size_t nBytes = count * ncclTypeSize(dataType); | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:517:10: warning: unused variable 'nBytes' [-Wunused-variable] 517 | size_t nBytes = count * ncclTypeSize(dataType); | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:517:10: warning: unused variable 'nBytes' [-Wunused-variable] 517 | size_t nBytes = count * ncclTypeSize(dataType); | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:517:10: warning: unused variable 'nBytes' [-Wunused-variable] 517 | size_t nBytes = count * ncclTypeSize(dataType); | ^~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:17: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:19: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:22: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:33:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 33 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:17: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:19: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:22: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:33:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 33 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:17: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:19: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:22: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:33:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 33 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:17: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:19: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:22: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:17: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:19: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:22: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetA21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:33:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 33 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ ttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:33:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 33 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:17: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:19: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:22: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:33:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 33 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:17: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:19: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:22: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:33:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 33 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:17: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:19: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:22: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:33:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 33 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:16: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:17: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:19: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:22: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:33:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 33 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ 15 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:17: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:19: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:22: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:33:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 33 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:17: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:19: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:22: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:33:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 33 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:16: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 15 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:16: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 15 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:16: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 15In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:16: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx1030. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:16: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:16: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 15 warnings generated when compiling for gfx942. In file included from 15 warnings generated when compiling for gfx1101. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:16: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:16: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:16: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:16: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 15 warnings generated when compiling for gfx1200. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:712:16: warning: unused variable 'ret' [-Wunused-variable] 712 | ncclResult_t ret = ncclSuccess; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:724:16: warning: unused variable 'ret' [-Wunused-variable] 724 | ncclResult_t ret = ncclSuccess; | ^~~ 15 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:712:16: warning: unused variable 'ret' [-Wunused-variable] 712 | ncclResult_t ret = ncclSuccess; | ^~~ :712:16: warning: unused variable 'ret' [-Wunused-variable] 712 | ncclResult_t ret = ncclSuccess; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:724:16: warning: unused variable 'ret' [-Wunused-variable] 724 | ncclResult_t ret = ncclSuccess; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:724:16: warning: unused variable 'ret' [-Wunused-variable] 724 | ncclResult_t ret = ncclSuccess; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:712:16: warning: unused variable 'ret' [-Wunused-variable] 712 | ncclResult_t ret = ncclSuccess; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:724:16: warning: unused variable 'ret' [-Wunused-variable] 724 | ncclResult_t ret = ncclSuccess; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:712:16: warning: unused variable 'ret' [-Wunused-variable] 712 | ncclResult_t ret = ncclSuccess; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:724:16: warning: unused variable 'ret' [-Wunused-variable] 724 | ncclResult_t ret = ncclSuccess; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:712:In file included from 16/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ : warning: unused variable 'ret' [-Wunused-variable] 712 | ncclResult_t ret = ncclSuccess; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:724:16:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:712:16: warning: unused variable 'ret' [-Wunused-variable] 712 | ncclResult_t ret = ncclSuccess; | ^~~ warning: unused variable 'ret' [-Wunused-variable] 724 | ncclResult_t ret = ncclSuccess; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:712:16: warning: unused variable 'ret' [-Wunused-variable] 712 | ncclResult_t ret = ncclSuccess; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:712:16: warning: unused variable 'ret' [-Wunused-variable] 712 | ncclResult_t ret = ncclSuccess; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:724:16: warning: unused variable 'ret' [-Wunused-variable] 724 | ncclResult_t ret = ncclSuccess; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:724:16: warning: unused variable 'ret' [-Wunused-variable] 724 | ncclResult_t ret = ncclSuccess; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:712:16: warning: unused variable 'ret' [-Wunused-variable] 712 | ncclResult_t ret = ncclSuccess; | ^~~ :712:16: warning: unused variable 'ret' [-Wunused-variable] 712 | ncclResult_t ret = ncclSuccess; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:724:16: warning: unused variable 'ret' [-Wunused-variable] 724 | ncclResult_t ret = ncclSuccess; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:724:16: warning: unused variable 'ret' [-Wunused-variable] 724 | ncclResult_t ret = ncclSuccess; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:724:16: warning: unused variable 'ret' [-Wunused-variable] 724 | ncclResult_t ret = ncclSuccess; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 4 warnings generated when compiling for gfx906. 4 warnings generated when compiling for gfx908. 4 warnings generated when compiling for gfx1102. 4 warnings generated when compiling for gfx90a. 4 warnings generated when compiling for gfx1100. 4 warnings generated when compiling for gfx942. 4 warnings generated when compiling for gfx1200. 4 warnings generated when compiling for gfx1101. 4 warnings generated when compiling for gfx1201. 4 warnings generated when compiling for gfx1030. 4 warnings generated when compiling for host. [ 56%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_setup.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_setup.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_setup.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_setup.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc 15 warnings generated when compiling for host. [ 56%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_status.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_status.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_status.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_status.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_status.cc In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:128:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 128 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:128:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 128 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:128:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 128 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:128:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 128 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:128:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 128 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:128:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 128 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:128:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 128 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:128:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 128 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:128:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 128 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:128:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 128 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:128:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 128 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 3 warnings generated when compiling for gfx1100. 3 warnings generated when compiling for gfx90a. 3 warnings generated when compiling for gfx942. 3 warnings generated when compiling for gfx1030. 3 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_status.cc:6: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_status.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 3 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_status.cc:6: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_status.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_status.cc:6: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_status.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_status.cc:6: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_status.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from 3/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_status.cc:6: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_status.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_status.cc:6: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_status.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_status.cc:6: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_status.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_status.cc:6: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_status.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 3 warnings generated when compiling for gfx1200. 3 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_status.cc:6: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_status.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_status.cc:6: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_status.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 3 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/misc/msccl/msccl_status.cc:6: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_status.h:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 3 warnings generated when compiling for host. 1 warning generated when compiling for gfx942. [ 56%] Building CXX object CMakeFiles/rccl.dir/hipify/src/transport/coll_net.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport/coll_net.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport/coll_net.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport/coll_net.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc 1 warning generated when compiling for gfx1100. 1 warning generated when compiling for gfx1101. 1 warning generated when compiling for gfx1200. 1 warning generated when compiling for gfx1201. 1 warning generated when compiling for gfx908. 1 warning generated when compiling for gfx90a. 11 warning generated when compiling for gfx906. warning generated when compiling for gfx1030. 1 warning generated when compiling for gfx1102. 1 warning generated when compiling for host. [ 56%] Building CXX object CMakeFiles/rccl.dir/hipify/src/transport/generic.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport/generic.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport/generic.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport/generic.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/generic.cc In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/generic.cc:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/generic.cc:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/generic.cc:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/generic.cc:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/generic.cc:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/generic.cc:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/generic.cc:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/generic.cc:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/generic.cc:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/generic.cc:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/generic.cc:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/generic.cc:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/generic.cc:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/generic.cc:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/generic.cc:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/generic.cc:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/generic.cc:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/generic.cc:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:10: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:203:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 203 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:406:21: warning: unused function 'sharedBuffersGet' [-Wunused-function] 406 | static ncclResult_t sharedBuffersGet(struct ncclCollNetSharedRes* collNet, int type, int slot, int channel, int* offset) { | ^~~~~~~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/generic.cc:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/generic.cc:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:10: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:10: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, ranIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:203:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 203 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:406:21: warning: unused function 'sharedBuffersGet' [-Wunused-function] 406 | static ncclResult_t sharedBuffersGet(struct ncclCollNetSharedRes* collNet, int type, int slot, int channel, int* offset) { | ^~~~~~~~~~~~~~~~ k, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:203:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 203 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:406:21: warning: unused function 'sharedBuffersGet' [-Wunused-function] 406 | static ncclResult_t sharedBuffersGet(struct ncclCollNetSharedRes* collNet, int type, int slot, int channel, int* offset) { | ^~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/generic.cc:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/generic.cc:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:10: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:203:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 203 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:406:21: warning: unused function 'sharedBuffersGet' [-Wunused-function] 406 | static ncclResult_t sharedBuffersGet(struct ncclCollNetSharedRes* collNet, int type, int slot, int channel, int* offset) { | ^~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:10: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:203:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 203 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:406:21: warning: unused function 'sharedBuffersGet' [-Wunused-function] 406 | static ncclResult_t sharedBuffersGet(struct ncclCollNetSharedRes* collNet, int type, int slot, int channel, int* offset) { | ^~~~~~~~~~~~~~~~ In file included from 2 warnings generated when compiling for gfx1030. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:10: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | staIn file included from tic ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:203:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 203 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:406:21: warning: unused function 'sharedBuffersGet' [-Wunused-function] 406 | static ncclResult_t sharedBuffersGet(struct ncclCollNetSharedRes* collNet, int type, int slot, int channel, int* offset) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:10: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:203:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 203 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:406:21: warning: unused function 'sharedBuffersGet' [-Wunused-function] 406 | static ncclResult_t sharedBuffersGet(struct ncclCollNetSharedRes* collNet, int type, int slot, int channel, int* offset) { | ^~~~~~~~~~~~~~~~ 2 warnings generated2 warnings generated when compiling for gfx942. when compiling for gfx1200. 2 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:10: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:203:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 203 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:406:21: warning: unused function 'sharedBuffersGet' [-Wunused-function] 406 | static ncclResult_t sharedBuffersGet(struct ncclCollNetSharedRes* collNet, int type, int slot, int channel, int* offset) { | ^~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:10: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:203:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 203 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:406:21: warning: unused function 'sharedBuffersGet' [-Wunused-function] 406 | static ncclResult_t sharedBuffersGet(struct ncclCollNetSharedRes* collNet, int type, int slot, int channel, int* offset) { | ^~~~~~~~~~~~~~~~ In file included from 22 warnings generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:10: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:203:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 203 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:406:21: warning: unused function 'sharedBuffersGet' [-Wunused-function] 406 | static ncclResult_t sharedBuffersGet(struct ncclCollNetSharedRes* collNet, int type, int slot, int channel, int* offset) { | ^~~~~~~~~~~~~~~~ 2 warnings generated when compiling for gfx1102. 2 warnings generated when compiling for gfx906. 2 warnings generated when compiling for gfx1101. 2 warnings generated when compiling for gfx1201. 22 warnings generated when compiling for gfx1030. 22 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:9: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:10: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:203:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 203 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/coll_net.cc:406:21: warning: unused function 'sharedBuffersGet' [-Wunused-function] 406 | static ncclResult_t sharedBuffersGet(struct ncclCollNetSharedRes* collNet, int type, int slot, int channel, int* offset) { | ^~~~~~~~~~~~~~~~ 2 warnings generated when compiling for gfx1100. 22 warnings generated when compiling for gfx942. 22 warnings generated when compiling for gfx1102. 22 warnings generated when compiling for gfx1101. [ 57%] Building CXX object CMakeFiles/rccl.dir/hipify/src/transport/net_tmp.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport/net_tmp.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport/net_tmp.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport/net_tmp.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc 22 warnings generated when compiling for gfx1200. 22 warnings generated when compiling for gfx906. 22 warnings generated when compiling for gfx90a. 22 warnings generated when compiling for gfx1201. 22 warnings generated when compiling for host. [ 57%] Building CXX object CMakeFiles/rccl.dir/hipify/src/transport/net_ib.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport/net_ib.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport/net_ib.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport/net_ib.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_ib.cc In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_infoIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ _t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:183:14: warning: unused variable 'info' [-Wunused-variable] 183 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:185:12: warning: unused variable 'mh' [-Wunused-variable] 185 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:187:9: warning: unused variable 'gdrMap' [-Wunused-variable] 187 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:219:19: warning: unused variable 'md' [-Wunused-variable] 219 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:21: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:285:21: warning: unused function 'netDumpMap' [-Wunused-function] 285 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:21: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:285:21: warning: unused function 'netDumpMap' [-Wunused-function] 285 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_ib.ccIn file included from :12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:21: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:285:21: warning: unused function 'netDumpMap' [-Wunused-function] 285 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:21: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:285:21: warning: unused function 'netDumpMap' [-Wunused-function] 285 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_ib.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_ib.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_ib.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_ib.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_ib.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_ib.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_ib.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_ib.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_ib.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_ib.cc:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:21: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:285:21: warning: unused function 'netDumpMap' [-Wunused-function] 285 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:21: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:285:21: warning: unused function 'netDumpMap' [-Wunused-function] 285 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:21: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:285:21: warning: unused function 'netDumpMap' [-Wunused-function] 285 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:21: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSysIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ 16tem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) warnings generated when compiling for { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:285:21: warning: unused function 'netDumpMap' [-Wunused-function] 285 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ gfx906. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:21: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:285:21: warning: unused function 'netDumpMap' [-Wunused-function] 285 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:21: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:285:21: warning: unused function 'netDumpMap' [-Wunused-function] 285 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ 16 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/gdrwrap.h:163:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 163 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:21: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_tmp.cc:285:21: warning: unused function 'netDumpMap' [-Wunused-function] 285 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ 16 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_ib.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_ib.cc:30: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 16 warnings generated when compiling for gfx942. 16 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_ib.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_ib.cc:30: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, inIn file included from t64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_ib.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_ib.cc:30: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, ilnResult_tt xmlFind Tag(stmruct ncaclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) {xNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, co16 warnings generated when compiling for gfx1101. nst int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xm nlode, con,st cha r* attrsName, tconst rint valuue) { | ^~~~~~~~~~~~~c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.ht:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | stnatic nccclRecsult_t xlmlSetAttrFlXmlNode* parentoat(,struct nc clXconstmlNod ec*h anr*o desubName, struct nccl,X const cmhar* atltrName, Node** scuonst fbl) oat{ | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] valu347e) { | | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclRsesult_tt xmlSeatAttrLotng(struict nccclXmlNode * node,n const cchar* attcrName, clonst Rint64_te valusuel) t_t xmlAd{d | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.hT:267:21ree(stru: cwarning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | ts tnacctilXc m16l*ncc dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvlRCesult_t oxmlUnsnetAttr(structv ncclXemlNoder* node,t constT char*o attrNIame) n{ | ^~~~~~~~~~~~ t/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21:( warning: unused function 'xmlGetSub' [-Wunused-function] c279 | statoic ncnclResulst_t xmtlGetS ub(strcucthar* str, int* va nclue, struct kvDict*cl XmlNodde* inode, const char* subNa warnings generated when compiling for gfx908. ct) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str,me, sstructt nccrlXmluNodec** subt) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21:k warning: unused function 'xmlGetSubKvInt' [-Wunused-function] v305 | Dstatiic nccclRestult_t* xmlGe tSubKdvInt(struct nicclXmclNotde)* {n o | ^~~~~~~~~~~~~~de, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_ib.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_ib.cc:30: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_ib.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_ib.cc:30: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static n/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_ib.cc:10: In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2cclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_ib.cc:30: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h: 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_ib.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_ib.cc:30: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) {164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node,ncclXml* xml, const char* tagName, struct ncclXmlNod/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_ib.cc:10: eIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:*14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: *warning: unused function 'log2i' [-Wunused-function] 44 | statinc lonog log2di(long ne) { | ^~~~~ ,In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_ib.cc:30 : /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21c: warning: unused function 'xmlAlloc' [-Wunused-function] 76o | static nncclResuslt_t xmlAtlloc(str uct nccclXml** xmhla,r * iantt trmaNxaNo | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | s const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* sdes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] In file included from me, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_ib.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | ncsclRestatic ncclResult_t xmlSetAuttrIfUtnset(struct ncclltXmlNode* node, const char* attrName, const char* val_t ue) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xxmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* s111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* nodmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(strearchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | statiatic long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_ib.cc:30: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] uct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ c ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSe,e constt charA* subtName, tstruct ncclXmlrNode**I sub)f { U| ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:n305:21: swarning: unused function 'xmlGetSubKvInt' [-Wunused-function] e 305 | ts(tsattrircNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ uct c ncnccclRlXmlNesult_t xm/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] lGetSubKv 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ Int(struct ncclXmlNode* no 305 | dstateic nccl,Result _t xmlGetcSubKvIont(strunct nccslXmlNodet* node, const char* subNamce, struhct ancclXmlNode** sub, const code* hnode, const cahar* attrrName, *const char* value)a { | ^~~~~~~~~~~~~~~~~t /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:t228:21: rwarning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | Nstataic ncclmRee,s uclotn_stt ximnltS aettAttrtValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct nrInt(struct ncclXmlNr*o subNadme, streuct nc*clXmlN ode** snub, coonst dchar*e attrN,ame, const intc attrVoaluen) { | ^~~~~~~~~~~~~~s /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmtl Achar* attrNddNode(struct ncclXml* xml, structcclXmlNode* sr cNoden) { | ^~~~~~~~~~ c/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21:c warning: unused function 'kvConvertToInt' [-Wunused-function] lX377mlNode* parent, const cha | static ncclResult_t kvConvertToInt(came, coonst int nvalues) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.ht:241 :21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | staticc ncclRhesualt_t xmlrSetAttr*Float str, i(strunct tn*cc vlXalmlue,Nod struct kvDicet* node,* const chdaicrt* ) at{t r| Nr* sau ^~~~~~~~~~~~~~bName m, str/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.heuct ncc,lXml:Nod e**390 subc): { 21 | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h::334:21: owarning: unused function 'xmlRemoveNode' [-Wunused-function] warning: 334n | stunused function 'kvConvertToStr' [-Wunused-function] satt ic ncclResult_t 390 | fxsltatic ncclResoatu value)l { t _| ^~~~~~~~~~~~~~~tmlRe /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.hmoveNode(st:16254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | ruct ncclXmlNode* node) { | warnings ^~~~~~~~~~~~~ generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_ib.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_ib.cc:30: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNod/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAkvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclReddsTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(ce** sub, const char* attorName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNonult_ts xmtde** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ lUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclRes chuar* stlr, int* tvalue, _structt kvDi ct* xdict) m{ l| ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.hG:390:e21: warning: unused function 'kvConvertToStr' [-Wunused-function] t390 | Sstautic nccblRes(ustrltu_tc t ncclXmlNode* node, const kvConvertTocStr(inht value,a const rchar*** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 16 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_ib.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_ib.cc:30: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:76:21: warning: unused function 'xmlAlloc' [-Wunused-function] 76 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:111:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 111 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:118:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 118 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:125:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 125 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:133:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 133 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:140:21: warning: unused function 'xmlFindTag' [-Wunused-function] 140 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:152:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 152 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:164:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 164 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:180:21: warning: unused function 'xmlFindNode' [-Wunused-function] 180 | static ncclResult_t xmlFindNode(struct ncclXmlNode* parentNode, struct ncclXmlNode* searchNode, struct ncclXmlNode** node) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:203:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 203 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:216:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 216 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:228:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 228 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:241:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 241 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:254:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 254 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:267:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 267 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:279:21: warning: unused function 'xmlGetSub' [-Wunused-function] 279 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:305:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 305 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:312:21: warning: unused function 'xmlAddNode' [-Wunused-function] 312 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:334:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 334 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:347:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 347 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:377:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 377 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/xml.h:390:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 390 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 16 warnings generated when compiling for gfx1030. 24 warnings generated when compiling for gfx1030. 24 warnings generated when compiling for gfx942. 24 warnings generated when compiling for gfx1200. 24 warnings generated when compiling for gfx1100. 2424 warnings generated when compiling for gfx906. warnings generated when compiling for gfx908. 24 warnings generated when compiling for gfx1101. 24 warnings generated when compiling for gfx1102. 24 warnings generated when compiling for gfx1201. 24 warnings generated when compiling for gfx90a. 16 warnings generated when compiling for host. [ 57%] Building CXX object CMakeFiles/rccl.dir/hipify/src/transport/net_socket.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport/net_socket.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport/net_socket.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport/net_socket.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_socket.cc 24 warnings generated when compiling for host. [ 57%] Building CXX object CMakeFiles/rccl.dir/hipify/src/transport/nvls.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport/nvls.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport/nvls.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport/nvls.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/nvls.cc In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_socket.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_socket.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_socket.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_socket.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_socket.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_socket.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_socket.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_socket.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_socket.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_socket.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_socket.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_socket.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_socket.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_socket.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_socket.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_socket.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_socket.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_socket.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_socket.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_socket.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_socket.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h44:13: :warning: unused function 'log2i' [-Wunused-function]13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h: 44 | static long log2i(long n) { | ^~~~~ 15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | sIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/net_socket.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ tatic long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx906. 2 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/nvls.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/nvls.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 2 warnings generated when compiling for gfx1101. 2 warnings generated when compiling for gfx1200. 2 warnings generated when compiling for gfx908. 2 warnings generated when compiling for gfx1030. 22 warnings generated when compiling for gfx90a. warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/nvls.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/nvls.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/nvls.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 77 | uint32_t y, head, mantissa; | ^ 2 warnings generated when compiling for gfx1201. 2 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/nvls.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/nvls.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/nvls.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/nvls.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/nvls.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/nvls.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 2 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/nvls.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/nvls.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/nvls.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/nvls.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/nvls.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for host. [ 58%] Building CXX object CMakeFiles/rccl.dir/hipify/src/transport/p2p.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport/p2p.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport/p2p.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport/p2p.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/p2p.cc In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/nvls.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/nvls.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/nvls.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/nvls.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/nvls.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/nvls.cc:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx908. 2 warnings generated when compiling for gfx90a. 2 warnings generated when compiling for gfx1200. 2 warnings generated when compiling for gfx942. 2 warnings generated when compiling for gfx1201. 2 warnings generated when compiling for gfx1030. 2 warnings generated when compiling for gfx1100. 2 warnings generated when compiling for gfx1101. 2 warnings generated when compiling for gfx1102. 2 warnings generated when compiling for gfx906. [ 58%] Building CXX object CMakeFiles/rccl.dir/hipify/src/transport/shm.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport/shm.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport/shm.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport/shm.cc.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/shm.cc In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/p2p.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/p2p.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/p2p.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/p2p.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/p2p.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/p2p.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/p2p.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/p2p.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/p2p.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/p2p.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/p2p.cc:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:215:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 215 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:226:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 226 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:237:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 237 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:249:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 249 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:262:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 262 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:272:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 272 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:283:13: warning: unused function 'isPow2' [-Wunused-function] 283 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/graph/topo.h:286:12: warning: unused function 'mirrorBits' [-Wunused-function] 286 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx942. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/comm.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/p2p.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/core.h:38: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/utils.h:44:13: warning: unused function 'log2i' [-Wunused-function] 44 | static long log2i(long n) { | ^~~~~ [ 58%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_gather_sum_i8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_gather_sum_i8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_gather_sum_i8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_gather_sum_i8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp 2 warnings generated when compiling for gfx1030. 2 warnings generated when compiling for gfx908. 2 warnings generated when compiling for gfx906. 2 warnings generated when compiling for gfx1201. 2 warnings generated when compiling for gfx1200. 2 warnings generated when compiling for gfx942. 2 warnings generated when compiling for gfx1102. 2 warnings generated when compiling for gfx1101. 2 warnings generated when compiling for gfx1100. 2 warnings generated when compiling for gfx90a. 2 warnings generated when compiling for host. [ 58%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_bf16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:20:15: warning: unused variable 'bid' [-Wunused-variable] 20 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:20:15: warning: unused variable 'bid' [-Wunused-variable] 20 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:20:15: warning: unused variable 'bid' [-Wunused-variable] 20 | const int bid = In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const iIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ nt w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:20:15: warning: unused variable 'bid' [-Wunused-variable] 20 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:20:15: warning: unused variable 'bid' [-Wunused-variable] 20 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:20:15: warning: unused variable 'bid' [-Wunused-variable] 20 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cppIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:20:15: warning: unused variable 'bid' [-Wunused-variable] 20 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:20:15: warning: unused variable 'bid' [-Wunused-variable] 20 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:20:15: warning: unused variable 'bid' [-Wunused-variable] 20 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:20:15: warning: unused variable 'bid' [-Wunused-variable] 20 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:20:15: warning: unused variable 'bid' [-Wunused-variable] 20 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75In file included from :7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:58:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 58 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:157:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 157 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8_2, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: : unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | : const int bid = ncclShmem.channelId - work->channelLo; | ^~~ 218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | : const 366int bid = ncclShmem.channelId - work->channelLo; | ^~~ :15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const iIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hnt bid = ncclShmem.channelId - work->channelLo; | ^~~ :11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:58:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 58 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:157:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 157 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8_4, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:58:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 58 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:171:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 171 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllGather_RING_LL128_Sum_i8_2, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:58:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 58 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:157:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 157 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8_2, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:58:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 58 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:157:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 157 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8_2, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:58:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 58 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:157:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 157 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8_2, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 11 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:58:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 58 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:157:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 157 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8_2, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:58:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 58 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:171:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 171 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllGather_RING_LL128_Sum_i8_2, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:58:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 58 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:157:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 157 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8_2, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:58:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 58 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:157:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 157 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8_2, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:58:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 58 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:157:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 157 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8_2, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:58:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 58 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:157:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 157 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8_4, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:58:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 58 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:157:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 157 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllGatIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:58:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 58 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:157:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 157 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8_2, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670her_RING_SIMPLE_Sum_i8_4, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RI | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ NG, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreadexpanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ s(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:58:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 58 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:157:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 157 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8_2, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:58:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 58 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:157:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 157 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8_4, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:58:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 58 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:157:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 157 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8_2, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:58:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 58 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:157:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 157 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8_4, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:58:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 58 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:157:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 157 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8_4, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:58:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 58 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:157:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 157 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8_4, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:58:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 58 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:157:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 157 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8_4, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:58:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 58 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:157:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 157 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8_4, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:58:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 58 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:157:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 157 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8_4, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:58:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 58 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_gather.h:157:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 157 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8_4, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: :60: note: field 'group' will be initialized after field 'stepSize' 670 | t/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ id(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthrea2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' ds(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: In file included from warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReducIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(te_RING_SIMPLE_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: id), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TIn file included from REE_SIMPLE_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_4, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_4, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_4, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), t/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) idInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_4, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_4, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_4, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) :/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | :670: 15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16_4, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_4, ncclFuncAllReduce, FuncMinMax, hip_bfloa Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_4, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>()t16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ .run(); \ > ().run| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(grou:15: pnote: field 'nthreads' will be initialized after field 'tidInBlock' )670 | , tid(tid ), n threads(n| threads), tidIn ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60Block(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: : field 'group' will be initialized after field 'stepSize'note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nth 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ reads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_4, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16_4, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ ==/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_4, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_4, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16_2, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_4, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_4, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_4, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_4, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PR_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16_4, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ OTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16_4, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_4, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16_4, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16_4, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16_4, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_4, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_4, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_4, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_4, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_4, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16_4, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16_4, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16_4, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16_4, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16_4, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 11 warnings generated when compiling for gfx1030. 11 warnings generated when compiling for gfx906. 11 warnings generated when compiling for gfx1200. 11 warnings generated when compiling for gfx1100. 11 warnings generated when compiling for gfx1201. 11 warnings generated when compiling for gfx1102. 11 warnings generated when compiling for gfx908. 11 warnings generated when compiling for gfx1101. 12 warnings generated when compiling for gfx942. 12 warnings generated when compiling for gfx90a. [ 59%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_bf8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hIn file included from :75/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp::2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:117: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: :/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | warning: barrieunused variable 'w' [-Wunused-variable]r_by_grou p(); 75 | | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29ba:15:rrier_by_group(); | ^~~~~~~~~~~~~~~~~~ note: expanded from macro 'barrier_by_group' 29 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hIn file included from :174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7:barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE;In file included from \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ :218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ :366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WIn file included from ARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uiIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ nt32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = nIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ cclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | fIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIlagThreZad((tid%4)==3)E, group()group), | , ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | s tepSize(ncclSh mem.co| ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) mm.buffS497izes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PR: Onote: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | T Oprims(tid,_ nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ LL128, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthrea/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cppd:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11s: In file included from )/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: ,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29 : warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] w496 | itid(tid)d, nthrea(ds(nthretads), wiid(tid%WAdRP_SIZE)%, warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE),WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | ( warp(tid/WARP_SIZE 498g | flargThread((otid%4)==3u), groupp(group)), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | , warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize (ncclSh mem.c| omm.bu ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ffSizes[NCCL_PRO T O| _ warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 L499 | stepSiL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group ze(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(step:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.commSiz.e_ == 0 ?b ncclShmem.comm.buuffSfizes[NCCL_PRfOTO_SIMPLSE]/NCCL_STEiPS/sizeof(zT) :e ss[tNeCpCSLi_zPeR_OTO_SIMP) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from X_DEV_ARITY, 1>, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmemncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatc.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 1>, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), ntthrehads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ reads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(ti/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ d), nt hreads(nt| hreads), tidInBloc tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_k(threadI dx.x), gr oup(group), | ^~~~~~~~~~~ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threa/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hdIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBa/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.htch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunW, RedOp, ProtoSimple<1, 1, COLL_orUNROLL>, COLL_UNROLL>k(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ n, T, RedOp, Algo, Proto, COLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: Size_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_4, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadI2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] dx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloa/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.ht8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_4, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, s/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthrubetn, work); | ^a /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:22:d1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here s22 | DEFINE_)ncclDevFu,nc(AllRedu ce_RINtG_SIMPLE_MiinMax_bfd8_4, ncclFIuncAllRedunce, FuncMiBnMax, rccll_bfloato8ck(threadIdx.x, NCCL_ALGO_RING, NCCL_PROTO_S), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_4, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ IMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidIn/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threBlock(threadIdx.x), gro/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hup(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PadIdxR.x), group(group)O, | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_T 671 | O step_Size(stepSiSze_ == I0 ? ncclShmeMm.comm.bPuffSizeLE]/NCCL_STEPS/si:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' zeof(T) : ss[NCCL_PR 611 | OTO_SIMPLE] RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254tepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direc:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested heret 254 | = Pri*mitives,t /*Diro, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | ect=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_4, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_4, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ .x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_4, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSize/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hs[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_4, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf8_2, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_4, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_4, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_4, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> p17rims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_4, ncclFuncAllReduc warnings generated when compiling for host. e, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_4, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_4, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_4, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(groumetric<1, NCCL_MAX_DEV_ARITY>, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), ntp), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ hreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ = if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_= 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15 : warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tinote: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | d(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ if (tid < subtn) RunWorkalgo, proto/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_4, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), , unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(tidInBlock(threadIdx.x), groupA(lgroup), | ^~~~~~~~~~~ lReduce_RING_SIMPLE_MinMax_bf8_thr4eads(nthr,eads), tidInBlock(threadIdx. x), grounp(group)c, | ^~~~~~~~~~~ clFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | st:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ epSize(stepSize_ == 0 ? ncclShmem.comm.buf/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hfSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | /0, ProtsotepSize, 0(> primss | ^ t/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:e5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runpTreeUpDSown, C=OLL_UNROL=L 0>( ? ncclShmem.comm.buffSizes[NCtid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | CL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives(c).run(trk); | ^, /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp 0, :P17roto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5:1:: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | Dnote: EFINE_in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested herencclDevFunc(AllReduce_TREE_SIMPLE 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432_Min | Max_bf 8_4, nc clFuncAl lReduc e, Func MinMax, rccl_bifloat8, NfCCL_AL GO_TREE, (NCCL_PROTO_SIMPLtE, 4) id < subtn) RunWorkColl, algo, protoo, COLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf8_4, , unnroll>()c.run()c; \ | l ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670F:15: note: field 'nthreads' will be initialized after field 'tidInBlock' u 670 | tid(tid), nnthreadsc(nthAreads),l tidInBllock(thRreadIdxe.x), gdroup(guroup), c| ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.he:670:60, : Fnote: unfield 'group' will be initialized after field 'stepSize'c Min670 | M ax , triccdl(_tbifdl)o,at8 nthreads(nthreads), , NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, tidInBplock(rthreaodIdx.tx), grooup(gro,up), | ^~~~~~~~~~~ unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf8_4, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_4, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf8_4, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf8_4, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_4, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_4, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFIN 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinNMax_bf8_4, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ ROLL>(tid, nthreads/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(gro, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); up), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8_4, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf8_4, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf8_4, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf8_4, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf8_4, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthread/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: s(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf8_4, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1101. 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx942. [ 59%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f16.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, fIn file included from lag1,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2 : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hd:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7a: warning: unused variable 'w' [-Wunused-variable] 75 | t baarrier_b2y_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | connote: expanded from macro 'barrier_by_group' s29 | ctonst int w = thireadIdx.nxt w = t/WAhRP_SIZEr; \ | e ^ adIdx.x/WARP_SIZE; \In file included from | ^ , flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, d/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cppata2:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: , flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ :218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | co:366:15n: warning: unused variable 'bid' [-Wunused-variable] s366 | t int w const =inIn file included from threadIdx.x/t bWid = ncAclShmRe/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from m/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: .In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.hchannelId :75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hP_S:IZE;29:15: note: expanded from macro 'barrier_by_group' 29 | const int \ | ^ - work->channelLo; | ^~~ w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group();In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncMinMax<__half>, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f16_2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncMinMax<__half>, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f16_2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), ntit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncMinMax<__half>, ProtoLL128, 2>' requested here 1070 | runTreeSplitepSize((stepSitze_ == i0 ? ncdclSh, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f16_2:254:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COL, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ L_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:REE, NCCL_PROTO_SIM175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncMinMax<__half>, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f16_2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatcPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ h, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncMinMax<__half>, ProtoLL128, 2>' requested here nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f16_2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncMinMax<__half>, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f16_2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16_2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16_2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16_2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_4, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_f16_2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x),/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO g_roup(gSroup),I | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~M | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ P671 | LstepSiEze(ste]pSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] ,670an | Asy m/metr i*cd, /*Dci(rectt=t*/0,= iProt*od, 0>/ p)rim0s , | ^, /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h :565 :5n: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested hereP t 565 | r h rounrTreteUepDowonanle<1, t1, CpOhLL_UNrRrOLL>i,e COLmLa_UNRs ds), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(ti | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | OLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h runTreeUpDown, 0, 2, 4>::run' requested here N432 | R Oif (tidd , subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_4, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Run,Wor kColCOLL_UNROLL>(tid, nthreaIn file included from ds, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE,432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (l().nrun()tid, subRtn, uworkn); W| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cppo:17:r1: note: kin instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here C17oll().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Al NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ lReduce_T16_4,R nccElFunEcAll_ReduSceI, FunMcMinPMaLx, hEalf,_ NCMCL_AiLGO_nTREME, NaCCL_xPROT_O_SIfMPLE1, 4)6 | ^_ 2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMP/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hL:611:E62: note: ,expanded from macro 'DEFINE_ncclDevFunc' 611 | 2 Run)WorkB atch , a:lgo611, pr:oto,62 u:nrol l>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthr15: enote: field 'nthreads' will be initialized after field 'tidInBlock' a670 | d tsid(t)id),, nth readst(nithreadds),I tidnInBlBock(lthreadIdx.x),o group(groucp), k | ^~~~~~~~~~~~~~~~~ (/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:t60: note: field 'group' will be initialized after field 'stepSize'h 670r | e tida(tidd), ntIhreadds(nxthrea.ds),x tid)InBlo,ck(t hreagdIdxr.xoup(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:), group(group), | ^~~~~~~~~~~ 60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16_2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_f16_2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_4, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16_2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nIn file included from threads/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h):11: In file included from ,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670 :15: warning: initializer order does not match the declaration order [-Wreorder-ctor] t 670 | i tid(tdid), nIthreadnBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ s(nt/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hhreads), :tidIn670Block:(thre60adIdx:.x) , gronote: up(grfield 'group' will be initialized after field 'stepSize'oup) 670 | tid(tid), , | n ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ t 671 | h rsteads(nthreaepSize(stepSds), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | :5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_4, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16_2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | ti | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16_4, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' d(tid), nthreads(nthreads), tidInBlock(threa 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ dIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Pr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0oto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, CO ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ LL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h :611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ tid(tid), nthread 671 | ss(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_4, ncclFuncAllReduce, FuncMinMax, halefads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_4, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_4, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16_4, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_4, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_4, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWork/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_4, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Coll().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16_2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16_2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthrea/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16_4, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670ds(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_4, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: 17 warnings generated when compiling for host. note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCC/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] L_PROT O670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16_2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ _SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16_4, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16_4, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_4, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_4, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16_4, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16_2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_4, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_4, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_4, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, C/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16_4, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_4, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid),, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, wor/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclSk); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hhmem.comm.buffSizes[NCCL:432:78:_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16_4, ncclFuncAllReduce, FuncMinMax, half, note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtnN,CCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(th work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cppreadIdx.x), group(group), | ^~~~~~~~~~~ :17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_4, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16_2, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16_4, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_4, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_4, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16_4, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16_4, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16_4, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 21 warnings generated when compiling for gfx942. 21 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1200. [ 59%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f32.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 21 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ [ 59%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f64.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cppIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrierIn file included from _by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: In file included from warning: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5:unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ :366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclSIn file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ hmem.channelIIn file included from d/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:In file included from 15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ :218/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ :15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ :218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ :366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), gro/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ up(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_4, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, ntthirde(atdisd,) ,w onrtkh)r;e a d| s ^( nthreads), /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.ht:i432d:I78n:B lnote: oin instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested herec k(thread I432d | x . x ) , girfo u(pt(igdr oc(c)l.Srhumne(mt.icdo,m ms.ubbutfnf,S iwzoersk[)N;C C L| _ ^P ROTO_SIMP/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cppL:7E:]1/:N Cnote: Cin instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested hereL _STEPS/siz e7 | oDfE(FTI)N E:_ nsctcelpDSeivzFeu_n)c ({A l l| R ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~e d u| c group(groupe _TREE_SIMPLE_MinMax_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hf:33032:_902:, note: nin instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested herec clFuncAllR e303d | u c e , F uPnrciMmiintMiavxe,s ,| ^/ *Dire/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hct:=611*:/620:, note: Pexpanded from macro 'DEFINE_ncclDevFunc' roto, 0611> | p r i RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ms | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_4, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ NROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h if (tid < subtn)In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp: RunWo2rkCol: l()175.r: un(t/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.hid, s:ubtn,498 work:); 29 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:12:1:: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEwarning: FI:670:field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor]15: warning: initializer order does not match the declaration order [-Wreorder-ctor] N670 | E _ tid496n(tid | )c, n tclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid(tid), nthreadshr(eads(nnthreatds), htidInBrlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proteads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ o, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32_4, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_4, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_4, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_4, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ROLL>/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_4, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. L_UNROLL>, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_4, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32_2, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_4, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_4, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_4, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_4, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_4, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_4, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_4, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_4, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_4, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32_4, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_4, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_4, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_4, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32_4, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32_4, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32_4, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_4, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32_4, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32_4, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32_4, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.bu/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_4, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32_4, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_4, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32_4, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32_4, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid =:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ o; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ OLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_4, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ : note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMP/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_4, ncclFuncAllReLE_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ duce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stSIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_f64_2, ncclFuncAllReducepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64_4, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ e, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_4, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | i/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hf: (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_4, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_4, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_4, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_4, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> primwork); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' s | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_4, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_4, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_4, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_4, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64_4, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_4, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_4, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_S/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ >().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_4, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_4, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64_4, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64_4, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64_4, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_4, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64_2, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64_4, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_4, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_4, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_4, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_4, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64_4, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_4, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64_4, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64_4, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64_4, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64_4, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64_4, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1200. 21 warnings generated when compiling for gfx942. 21 warnings generated when compiling for gfx90a. [ 60%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx942. [ 60%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u32.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ In file included from | ^/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h :11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE;In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ data1, flag1, data2, fIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1,lag2 ; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.hd:145:28: awarning: unused variable 'data2' [-Wunused-variable] 145 | t uinta32_t dat2a1, flag1, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h, d:ata2, f145lag2; : | ^~~~~21: warning: unused variable 'flag1' [-Wunused-variable] /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h :145145 | uint32_t data:35:1 warning: unused variable 'flag2' [-Wunused-variable] 145 | , uin t32_t flag1, datIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ a2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t da t145 | a u1int3, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | 2_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w =/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.ch/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hannelId - work->:218:channelLo; | ^~~ 15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->chanIn file included from nelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: 15In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: :In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7warning: : warning: unused variable 'w' [-Wunused-variable] unused variable 'bid' [-Wunused-variable]75 | barri218 | const int bid = ncclShmem.channeer_lby_grIoup()d; | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = thr- work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.headIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] :366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | 218 con | st c oint binst int bid = nd = ncclShmem.channelId - work->/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hIn file included from channelLo; | ^~~ cclShmem.channelId - work->channelLo; | ^~~ :366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid =In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from n/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:c174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7:c warning: unused variable 'w' [-Wunused-variable] 75l | Shmem.channelId - work->channel L boarrier_;by_group( ); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:| ^~~ 15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flagIn file included from 2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ :21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t daIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ ta1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ E; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->unused variable 'bid' [-Wunused-variable]c 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ hannelL/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ o; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8_2, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8_2, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f8_2, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f8_2, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f8_2, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8_2, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f8_2, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizesIn file included from [NCC/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthL_PrROTO_SIMePLE]/NCCL_SaTEPS/sizeofd(T) : sstepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> pri(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmemsm | ^ ./builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5c: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here o565 | rmunTreeUpmDown), nthr,ead_s(n tShreaCTEPS/sizeof(T) : stOLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < sudsb), titdInBlnock()threa dIdx.xR), gruoup(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.cepoSize_m) { m | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~. | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hb:254u:90: note: fin instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254f | S Primiitzives, roto,/ COLL*_UNRODLL>_PiR(OTOr_)SIMeP.LE]c/rNCCtLu_S=*/0, Protn(tid,o su,btn, w0T>EPS /sipozerrofik(Tm)) s;: st ep| | Si ^ ^ze _/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~:: 5657| group(group:: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h5:1:: 254:note: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDownin instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPL90:E note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here_ M254 | i n PMrimiativxes<_T, fRed8O_p, 2FanA,sym metnriccRled,ROp e, /dPr*uotDcoSieimr,ple e,P COrLL_oUNRtOLLo>(ti,d, nth0rea>ds, woprk)r; i| ^nm M/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hs ax , r| cc ^l_ :fl/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h432o:at878, ::NCC L_note: 565in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested hereA:5 L: Gnote: 432 | O_T REE , in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here N iC565 | fC L _(ruPtinTrd Ru(nWo)rk.BatrchLL>,, C OLLa_UlNROgLL>o(ti,d, nthpreards,o wotrk);o | , ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h :uun432n(t:rido78, l:sul bt>note: nin instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here,( w )or.kr); u | ^n /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: (note: 432)in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here | ; \ 7 | | D ^Ei Ff/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h I(NEt:_i670nd:c 15c<:l Dsnote: eufield 'nthreads' will be initialized after field 'tidInBlock'vb Ft nun)670c ( | AR lu ln RW eotdriukdcC(eotil_dlTRE),E< _FnSntI,MhPreL aEdT_s, R(nthredeOMapid,ns M)Aa,lx g_toif,d8 I_Pn2rB, otnolc,oc clCkFO(uLtnLhcr_AeUlaNldRRIOedLdxL>u.(cx)e).,,r uFgnur(notcuiMpdi(,gnr Mosauuxpb,t) n,r, c cw| l ^~~~~~~~~~~~~~~~~o_ rf/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hkl);o: a670 t:608| :, ^ note: N/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cppCfield 'group' will be initialized after field 'stepSize' C L:7_670:A | 1L :G O note: _ in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested heretT iR EdE(7,t | iDNdEC)FC,IL N_nEPt_RhnOrcTecO_adSslI(DMnePtvLhFEru,en ac2d()sA )l ,l| R^tedu /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hc:ei611_d:TI62Rn:EB Elnote: expanded from macro 'DEFINE_ncclDevFunc'o_Sc Ik M(611PtLE | _ hM riRenuaMndaWIxod_rxfk.8Bx_a)2t,,c hgn, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' CCL_670AL | GO _T RE E, NtCCiL_dPR(OTtO_iSIdMP)LE,, 2)n t| ^h /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hr:e611:a62:d s(nthreads), tidInBlock(threadIdx.x), gronote: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreaudp(sgr)o,up) , t | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ idInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8_2, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8_2, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8_2, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8_2, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(ti:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:d), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8_2, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TRE175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WAE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ RP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f8_2, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hexpanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primit=*/0, Proto, 0> primstives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8_2, ncclFuncAllReduce, FuncMinMax, rc | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hcl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads432 | ( if n(tid < t 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8_4, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ subtn) RhunWorkCroll().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8_2, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h NCCL:_PROT565O_SI:MPLE,5 2) :| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h :611:62:note: note: expanded from macro 'DEFINE_ncclDevFunc' in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here611 | RunW orkBatch565, algo, protro, unuroll>n().ruTn(); r\ | ^ e/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' e670 | U pDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8_2, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ dcx.kx(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE ) , gro498up( | gro up), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' f670l | a tigd(tTid)h, nrthreeads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ad((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f8_2, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f8_2, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8_2, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid),tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h: nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | 432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8_2, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8_2, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < 670 | tid(tid), nthreads(ntsubtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8_2, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ hreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8_2, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_f8_2, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ uffSizes[NCCL_PROTO_SIMPLE]/ AlNgo, Proto, COLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8_4, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^GO_T REE, N/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hCCL_PROTO_S:IMPLE,558 4) :| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:562: note: expanded from macro 'DEFINE_ncclDevFunc' : 611 | RunWnote: orkBatin instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested herech, al | go, runRing().rUun()N; \ | R ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:O670:LL>(15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads)tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work), ;tidI nBlock(threadI dx.x| ), g ^roup (gr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cppoup), | ^~~~~~~~~~~~~~~~~ :/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:67012:60: :note: field 'group' will be initialized after field 'stepSize' 1670 | : t id(tnote: id),in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here nth reads (nthread12s), | tidIDnBloEck(tFhIreadNIdx.Ex), _grounp(group), c | ^~~~~~~~~~~ clDevFunc(AllReduce_RING_SIMPLE_MinMax_f8_2, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8_2, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().r:670:15u: warning: initializer order does not match the declaration order [-Wreorder-ctor] n670 | t(id(tid)t, nthreiads(nthrdeads), ,tidInBl ock(thrseadIdx.ux), grobup(groutp), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ n, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEF | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ I 671 | N stepSizEe(step_Size_ =n= 0 In file included from cclDevFunc(AllR? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/s/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid),e duce_nRING_tSIMPLhE_MinMax_f8_2, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, izeNof(T)C : stCepSiLze__) { P| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ R| group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hO:303:90:T note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here O303 | _ PSrIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatchAsymme,tri/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkCollo, /*, proto, Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:r565eads:(nth5read:s), tidInote: nBin instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested herelock (th readIdx.565x), | gro up(g rFn, T, RedOp, Algo, Proto, COLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f8_4, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, pr oup), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~r | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_u 671n | T rstepeSizee(steUpSizep_ ==D 0 ?o nccwlShmnem.c().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tiodto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ InBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60:T, R edOpnote: , Pfield 'group' will be initialized after field 'stepSize'rotoS imppSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 670 | t 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f8_2, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ id(tid),le <1,n 1,t COhLL_UrNROeLL>a, CdOLLs_UN(ROLnL>(ttidh, nrthreeadas, dworsk);) | , ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h :t432:78i: note: din instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here I432 | n B lif o(ticd ().run(tid,x.x), group(group), | ^~~~~~~~~~~ subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8_2, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f8_2, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | run/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f8_2, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, TreeUpDown, COLL_U 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ NROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8_4, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threain instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f8_2, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ dx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8_2, ncclFuncAllReduce, FuncMi/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hnMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f8_2, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), grothreadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254up(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | Primitives, /*Direct=*/0, PrIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_f8_2, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | oto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, RunWnorkBatch, algo, proto, unroll>().run(); \ | ^ threads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) Ruif (tid < subtn) RunWorkColl().run(tid, subtn, work); | nWorkColl().run(tid, subtn, work); ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8_4, ncclFuncAllRed | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f8_2, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ uce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8_4, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8_4, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f8_2, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCC/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | r:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizeusnTreeUpD[own, PROTO_SIMPLE]/NCCL_STEPS/COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565_UNRO | LL>( ).run( tid, subtn , wrunTreeUork);p | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cppD:17:o1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested herew 17 | nDEFIN, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) Ru_nSIMPLWE, 4)o | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hr:611:62k: note: expanded from macro 'DEFINE_ncclDevFunc' C 611 | o RulnWorkBatch, al().run(tid,oto , usnroull>b().trun(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), n, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8_4, ncclFuncAllReduce, Fgurounp(gcrouMp),i | ^~~~~~~~~~~~~~~~~n /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:M670:60a: note: xfield 'group' will be initialized after field 'stepSize' ,670 | r ticd(tcid)l, n_thrfeadls(ntohreaadst),8 ti,dIn BloNCcCk(thLrea_dIdxA.x)L, GgroOup(_groTREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | up), | ^~~~~~~~~~~ RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8_4, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadId/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] x.x), group(group), | ^~~~~~~~~~~ 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8_4, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPL/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn)E_MinMax_f8_4, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f8_2, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8_4, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8_4, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ threadIdx.x), group(gro/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8_4, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid),up), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBloc| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hk(threadIdx.x), group(gr nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ oup), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? nc:clShmem.670comm.b:uffSiz15es[NCC:L_PRO TO_SIMwarning: PLE]/Ninitializer order does not match the declaration order [-Wreorder-ctor]CCL_ 670 | tid(tid), nthreads(STnEPS/sitzeof(Th) : strepSizee_) { a| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(groupds), tidIn /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here Block(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SI254 | M PPrimitiLves, /*DiSrect=T*/0, PrEoto, 0P> priSms | ^/ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:s5izeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here : note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558L>,: COL5L_UN:ROLL >(tinote: d, nin instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested herethre ads, work);558 | ^ | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h :432:78 : note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | r iuf (tnid (tid, nthreads, worrkkColl, 1, 2, 4>::run' requested here 432 | ro toi, CfOLL _UN(ROLtL>(i).rudn(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFIN < subtn) RunWorkColl().run(tid, subtn, work); | ^E_n ccl/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cppDevFunc:(Al22lRe:duc1e_T:REE _SInote: MPLin instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested hereE_M inM ax_f8_224, | nccDlFunEcAFllReIducNe, EFun_cMinnMacx, crccll_fDleoatv8,F NCuCL_nALGcO_(TREAE, NlCCLl_PRROTOe_SIdMPLuEce_RING_SIMPLE_MinMax_f8_4, ncclFuncAllReduce, Fu, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unry,o reldop>, (alg)o, .prorto, uunrnoll(>()).r;un() ; \\ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h| :670 ^:15: note: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hfield 'nthreads' will be initialized after field 'tidInBlock' 670 | : t670id:(ti15d),: nt hrenote: ads(field 'nthreads' will be initialized after field 'tidInBlock'nth rea ds), ti670d | I nBl ock (th reatdIdix.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nd(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreadsthreads(n(thrneadts),h tirdIneBloack(dthrsead)Idx,.x) , gtrouip(gdrouIp),n | B ^~~~~~~~~~~ lock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8_4, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8_4, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UN>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.RxOLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8_4, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90In file included from : note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ runTreeUpDown, /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8_4, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.b/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, ProtuffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f8_4, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ NCCL_MAX_DEV_ARITY>, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8_4, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8_4, ncclFuncAllReduce, Func tid(tid), nthreads(nthreads), tidInBlock(threMainMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ dIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8_4, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(t:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(steipd), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Size_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f8_4, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f8_4, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f8_4, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f8_4, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f8_4, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> priIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] ms | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < su 77 | uint32_t y, head, mantissa; | ^ btn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f8_4, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8_4, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f8_4, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ const int w = In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclSIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from hmem.ch/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hannelI:d - wor174k->cha: nnelLo/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h; | ^~~ :75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = th/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2r: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: eIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.ha:145:14: warning: unused variable 'data1' [-Wunused-variable]d 145 | I uintd32_t dxata1, .flag1x, da/tWARP_SIZE; \ a2| , flag ^2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h :175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80 :5: warning: unused variable 'w' [-Wunused-variable] c 80 | o barnrier_bsy_groutp(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29i:15: note: expanded from macro 'barrier_by_group' n29 | t c onst inwt = threadIdx.x/W Aw = thRreadIdPx.x/WA_RP_SSIZE; \ | I ^ZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrie/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366r_by_g:roup();15 | : ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29 :15: note: warning: expanded from macro 'barrier_by_group' 29 | unused variable 'bid' [-Wunused-variable] con st int w = threadI366dx.x/W | ARP_SI ZE; \ | ^ const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable]In file included from 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp: note: expanded from macro 'barrier_by_group' 29: | co2nst int w = threadIdx.x/WARP_SIZE; \ | ^ : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_S/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hI:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ ZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32_2, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32_2, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32_2, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32_2, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32_2, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(gr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(noup)t, | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3h 499 | r stepSize(encclShmem.acomm.buffSdizes[NCCL_s), tidInBlock(thrPROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, treeeadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Pr->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work)i;mitive s, /432*Direc:t=*/780, Pro:to, 0> pnote: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if rims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_u32_2, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ runTreeUpDown, COLL_UNROL(tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(L>A(tidl, ntlhreaRds, ewodrk);u | ^c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.he:432:78_: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested hereT 432 | R E ifE (ti_d < LsubtnL) Ru1nWor2kCol8l_MinMax_u32_2, ncclF().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFuuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ nc(AllReduce_TREE_SIMPLE_MinMax_u32_2, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32_2, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_u32_2, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL1 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_u32_2, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128,28, 2) | ^ 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthrea:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32_2, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGcclSOhmem_.comTm.buRffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthre/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor]ads-nthreadsSplit, &tree 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32_2, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' ->up, tree->down, workEE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, -p>senrdbufof, wtork-o>rec,vbuf f,u | ^n /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:r1070:5:o note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here l 1070 | l r>unTr(eeS)pli.t(rtid,e nthareadds, wosrk);) | ^, /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h :432:78t: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here i 432dInBloc | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_u32_2, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_u32_2, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32_2, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TOp, FanAsymmetric<1, NCCL_MAX_DEV_ARITY>, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32_2, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ REE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInB_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32_2, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ lock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBmem.comm.bulock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32_2, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : s:670:15:t warning: initializer order does not match the declaration order [-Wreorder-ctor] e670 | p tid(tSid), ntihreadsz(nthreaeds), ti_dInB)lock(th readId{x.x), group( group),| | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~| tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSi| ze(ste group(grouppSize_ == 0/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h ? ncclShmem.comm.buffSi:zes[N303CCL_PR:OTO_S90: note: IMPLE]/NCCin instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested hereL_STEP S/size of(T) : ste565pSize_) | { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h :63:56 : note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Prrimituives, e0, ProtUo, 0> pprims D| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:o558:5: note: win instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | n (tid,ROLL>, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl, 1, 2, 2>::run' requested here L432 | L if (t>id < su(btn) Ru)nWorkC.oll().run,(tid, s ubtn, swork);u | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cppb:12:1t: n, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllRein instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32_2, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGOdu_ce_RTING_RSIMPELE_MEinM,ax_ u32_N2, nCcclFCuncAlLlRed_uce,P FuncRMinMaOx, uTint32O_t, _NCCLS_ALGIO_RIMNG, PNCCL_LPROTEO_SI,MPLE , 2)2 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: )note: expanded from macro 'DEFINE_ncclDevFunc' 611 | R| unWo^rkBa tch/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h, algo, proto,tch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(gro uunrpoll)>(),.ru n() ; \| | ^~~~~~~~~~~~~~~~~ ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h :/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h670:15: note: :field 'nthreads' will be initialized after field 'tidInBlock' 670670: | 60 t:id( tidnote: ), field 'group' will be initialized after field 'stepSize'nth rea ds(n670thr | ead s), tidIn Blo ck(tthrieadIddx.(x),t grioupd(gr)oup,), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(thread nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Idx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(thre/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32_2, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ adIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/N/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32_2, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ CCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32_2, ncclFuncAllReduc:e, Func670MinMax, :uint3215_t, NCC:L warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), _ALnGO_TREEt, NCCL_hPRreads(nthreadsOT)O_SIMP,LE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.htidInBlock(threadIdx.x), gro:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatchC, algLo, pr_oto, unroll>().run()P; \ | R ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hO:670:15:T note: field 'nthreads' will be initialized after field 'tidInBlock' O670 | _ tidS(tid),I nthrMeaPLE]/NCCLds(n_threaSdsTEPS/sizeof(T)), tidI:nBloc k(thrsetepSize_) { | adI ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~dx.x ), gr oup(| grou group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90:p), | note: ^~~~~~~~~~~~~~~~~ in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670 :60254: note: field 'group' will be initialized after field 'stepSize' | 670 | Primitive tid(tid), ns, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hthreads(nt:hrea565ds),: ti5dInB:lock (thrnote: eadIin instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested heredx.x) , group(gro565up), | | ^~~~~~~~~~~ runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32_4, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32_2, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32_4, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32_2, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32_2, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32_2, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32_2, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32_2, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthre/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.ha:670d:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] s670 | ) tid(ti,d), nthre adtidInBlock(thres(nthraeads), tiddInBlock(IthreadIdx.xd), group(xgroup), . | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ x 671 | ), grou stepSp(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | iz e(stepSize _ == 0 ? ncstepSize(stepSclShmeim.comm.ze_ == 0 ?buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | M PrimiAtives, /*Direct=*/0, Proto, 0> prims | ^ FanAsymmetric<1, NCCL_MAX_DEV_ARITY>, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here S 565 | i runTrmeeUppDown, CO,LL_UNR OLL>(tCid, nOLL_UNROLL>, COLL_UNROLL>(tid, nthreads, wothrreads, kwork);) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h;:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | | ^if /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < s (tid < subtn) RunWorkColl().rgo, uPronto,( COLtL_UNiROLLd>().,run( tid,s subutn, bworkt); n| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp,:7 :1: wnote: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here o7 | DErFINkE_ncc); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32lDev_Func4(AllR,educ e_TRnEE_ScIMPLEc_MinlMax_Fu32_u2,n nccclFunAcAlllReducle, FRuncMeinMadx, uuint3c2_t, eNCCL,_ALG O_TREFuE, ncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch62: note: ,expanded from macro 'DEFINE_ncclDevFunc' 611 | a RunlWorkgBatcho,o algto, poroto,, un rollu>().nrun()r; \ o | ^ l/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670l:15: >note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | ( tid()tid)., run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(nthreads(nthreads), tidInBlock(threadtid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(groupId)x.x),, gr oup( grou| p), ^~~~~~~~~~~ | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadId/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32_2, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32_2, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ TO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32_4, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32_4, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32_4, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ SIMPLE]/NCCL_STEPS/sizeIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Pof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_u32_2, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ lgo, Proto, COLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32_4, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32_2, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(tIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:hreadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32_2, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_u32_2, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32_2, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBloIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid ck(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize<_ subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32_2, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32_4, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32_2, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().r/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32_4, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ un(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_M/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] inMax_u32_4, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670: 15670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32_4, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ : note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 32_4, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32_2, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32_4, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32_4, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkB | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_a tch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ == 0 ? ncclShme/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); m.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/ s| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32_4, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ izeof(T) : stepSize_)/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | ru/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMnTreeUpDown, COLPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives(tid, nthreads, work)FanSymmetric<1>, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32_4, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_nccl,D RedOp, ProtoSimple<1, 1, COLL_UNROLL>, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32_4, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ evFunc(AllReduce_TREE_SIMPLE_MinMax_u32_4, ncclFuncAllReduce, Fun/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hc:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ MinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32_4, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32_4, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32_4, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(.x)t, group(igroup), d | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:)670:60: note: field 'group' will be initialized after field 'stepSize', 670 | tid(tind)threads(nthr, nthreeads(nthareads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ds), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32_4, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32_4, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32_4, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32_4, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32_4, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32_4, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlo:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor]ck( thread 670 | Idx .x), gr tioupd(tid), n(grotup), hreads(n| ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | t tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ hreads), t 671 | stepSiidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSzei(stepSizez_ == 0 ? encclShmsem.comm.[buffSizesN[NCCL_PCROTO_SIMCPLE]/NCCLL_STEPS/s_izeof(T) P: stepSizRe_) { | O ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hT:63:56:O _SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) note: {in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Prim itives, | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h0, Proto, :303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | 0> ^ prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runR:ing5(tid, nth:reads, work); note: | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work);LL_ UNROL L>().ru| n(tid ^, subtn , work/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:22:1: note: :432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | ifin instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | (DEFINEt_ncclDeivFunc(AdllR < subeducte_RnI) RunWorkColl(FuncM)inMax,. run(tidui,nt32_t , subtn, work); | ^NC CL_ALGO/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp_RING, NCCL_:17:PROTO1:_SIMPL note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32_4, ncclFuncAllReduce, FuEn, 4) c | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:M611:62: inote: expanded from macro 'DEFINE_ncclDevFunc' 611 | n RuMnWorkBaatcxh, ailgo, pnroto,t unroll3>().ru2n(); \_t, NCCL_ALGO_T | ^R /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:E15: E, NCCL_PROTO_SIMPnote: field 'nthreads' will be initialized after field 'tidInBlock' L 670 | E tid,(tid), 4) n | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBthreadas(nthretads),c tidInhBlock(thre, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | ad Id17x.x)t, groid warning(s generated when compiling for host. tid), up(gronup)t, | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hh:670:60: rnote: field 'group' will be initialized after field 'stepSize' 670 | e tiad(tid),d nthreasds(nthr(eads),n tidItnBlockhreads), tidInBlock(threadIdx.x)(th,r egadIrdx.ox), ugropup((grougpr), o | ^~~~~~~~~~~u p), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32_4, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32_4, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32_4, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32_4, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1101. 21 warnings generated when compiling for gfx942. 21 warnings generated when compiling for gfx90a. [ 60%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u64.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t In file included from data1, flag1, dat/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from a/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:1752: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5:, In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ warning: unused variable 'w' [-Wunused-variable] 80 | f balagrrier_2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t d/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from a/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:t173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7a: warning: unused variable 'w' [-Wunused-variable] 175 | , flag1, data2, barrier_by_group(by_gr)oup(); ;| ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h :29:15: note: expanded from macro 'barrier_by_group' 29 | | co ^~~~~~~~~~~~~~~~~~nst int w = th/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hreadIdx.x/WA:RP_SI29:15: note: expanded from macro 'barrier_by_group' 29 | ZIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ E; \ | c ^ onst int w = threadIdx.x/WAflag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flagRP_S1IZE; \ | ^ , data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channeIn file included from lId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.xIn file included from /W/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:ARP_SIZE; \ | ^ In file included from 2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27| ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h | :29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/ const int bid = ncclShmem.channelId - work->channelLo; | ^~~ WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data:218:15: warning: unused variable 'bid' [-Wunused-variable] 2, flag2; | 218 ^~~~~ | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h const int w = threadIdx.x/WARP_SIZE; \ | ^In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ :366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const iIn file included from In file included from nt bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15145: warning: unused variable 'bid' [-Wunused-variable] :27 | 28: warning: unused variable 'data2' [-Wunused-variable]const int bid = ncclShm145em.cha | nnelI d - w ork->ch annel Lo; | u ^~~ int32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | conIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ st int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:\27 | ^ :15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->cIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - worhIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ annelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShkm->channelLo; | ^~~ em.channelId - work->channelLo; | ^~~ - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ :21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work-> ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ channelLo; | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64_2, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here In file included from 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_u64_2, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | Run/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:W2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.ho:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173r: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15k: warning: initializer order does not match the declaration order [-Wreorder-ctor] B670 | a tidt(tid),c nthreahds(nthreads), , algo, proto, unroll>().run(); \ | InBlo ^ck(thre adIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64_2, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSSIMiPLE,z 2) e | ^ (/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611s:62: note: texpanded from macro 'DEFINE_ncclDevFunc' e611 | p RuSnWorkiBatczh=, al go, proto, 0unro ll>(?).run (); n\ | c ^ c/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:l670:15: Snote: field 'nthreads' will be initialized after field 'tidInBlock' h670 | m teid(tmid),. nthcreados(nthreads), tidInBlock(threadIdx.x),mm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group gr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.houp(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h::670:60254: note: field 'group' will be initialized after field 'stepSize': 67090 | : ti d(tinote: d), in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested herenthr eads (nthread254s), | tidI Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, su warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3b 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < stn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64_2, ncclFuncAllReduce,ubtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_u64_2, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_u64_2, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64_2, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64_2, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadId/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64_2, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), : note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads) ,| ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ t671 | i sdtepSIize(nsteBpSizle_ =o= 0 c? nckclSh(mem.tcomhreadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: m.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64_2, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670In file included from :/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | 15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64_2, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64_2, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64_2, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | PrimitivesIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_u64_2, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ , 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u64_2, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthread(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ s(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64_2, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroIn file included from ll>().run(); /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_u64_2, ncclFuncAllReduce, FuncMinMax, uint64_t, N\ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ CCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STE 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64_2, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ PS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u64_2, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_u64_2, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | t warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u64_2, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ id(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64_In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64_2, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 2, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(thre/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64_2, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBladIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Directo=ck(threadIdx.x), group(group), | ^~~~~~~~~~~ */0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNRIn file included from OLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(s | DEFtINE_nccelDevFunpc(AllRedSuce_TREiE_SIMPLzE_MinMaex_u64_4,_ ncclFu ncAllRe=duce=, FuncM inMax, u0int64_t , NCCL_?ALGO_TR EE,ncclShmem.c NCCoL_PROTOm_Sm.bIMuPLEffSizes, [4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nAsymmetric, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64_2, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64_2, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthre/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:ads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_u64_2, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ 254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ (/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hgroup), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | : stepSi432ze(step:Size_ 78== 0 ? :ncclShme m.cnote: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) Romm.buuffSnizeWs[NCCLo_PROrTO_kSIMPLEC]/NoCCL_SlTEPS/lsizeo, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64_2, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREedEOp, Fa,nAsym metricN<1, NCCCL_MACX_DEVL_ARITY>, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work);_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested herefield 'nthreads' will be initialized after field 'tidInBlock' 432 | if (tid <670 sub | tn) Ru nWor kColl , FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(dtid, )subtn,, work) ;nthreads(nthreads), tidInBloc | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDev_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64_4, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611Func(AllReduce_TREE_SIMP:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ k(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ LE_MinMax_u64_2, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u64_2, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nt_PhROTO_SIMPLE]/NCCL_STEPS/sizerof(T) : steepSize_) { a | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hd:63:56: note: sin instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | ) Primiti, tidInBlock(thves, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u64_2, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Po, COLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLrimitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64_4, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ E_MinMax_u64_2, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64_2, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u64_2, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), grou/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] p(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64_4, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthtidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PRrOeads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ TO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(A/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hllReduce_TREE_SIMPLE_MinMax_u64_2, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBat:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | ch, algo, proto, tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepunroSll>().irun()z; \ | e ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h(:670:15: snote: field 'nthreads' will be initialized after field 'tidInBlock' t670 | e tid(ptid),S nthrieadsz(nthreeads),_ tidIn Block=(threa=dIdx. x), g0roup ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/s(giroup),z | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.he:670:60o: note: field 'group' will be initialized after field 'stepSize' f 670 | ( tid(tid), nthreads(nthreads), tidInBlock(threadIdxT) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Dire.xc), grtoup(g=roup),* | ^~~~~~~~~~~ /0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64_4, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u64_2, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u64_2, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthrea/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSds), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, ProtTY>, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64_4, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Op, Proto, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:22:1, COLL_UNROLL>, COLL_UNROL/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthrL>(tid, nthreads, work)eads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, ; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, s:u note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here b22 | DEFINtE_ncclnDe0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64_4, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreavFun,c(AllR educe_RwING_SIoMPLE_rMinMaxk_u64_4), ncclF;uncAl lReduc e, Fun| cMinMds), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ^ax, ui nt6/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp4_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64_4, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatchcoll, ty, redop, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | triun(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64_4, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ d(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group,p algo), pr,oto, unr oll>(| ).r ^~~~~~~~~~~~~~~~~u /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nn(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tidthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ), n/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid,threads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u64_4, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nt:h670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_)reads, work); | ^ { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u64_2, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u64_2, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_u64_2, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hIn file included from :/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:67011: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670::15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 15670 | : tid(tid ), ntwarning: hreads(ntinitializer order does not match the declaration order [-Wreorder-ctor]hreads), tidInBl ock(threadI670 | tid(tid), nthreads(dx.x), ngroup(grotup), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~h | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ reads), tidInBlock(thre 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | ffSize group(groups[NCCL _PROTO_SIMPLE]/NCC/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hL_STEPS/sizeof(T) : stepSize_): { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 63| group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h::63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 56 63 | P:rimitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | etric<1>, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | ru Primitives, 0, ProtonRi,ngUNR prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(dtid, Onthrepads, w,ork); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: Pin instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | r ifoto, COLL_UNROLL>(tid, nthreads, work); (tid | < ^ subt n) Run/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hWorkColl, 1, 2, 4>::run' requested here 432 | o, COLL_UNROLL>().run(tid, subtn, w if (tid < subtn) RunWorkColl12:1: (note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here )12 | DE.FIrNE_ncuclDevnFunc((AllRtid, seuduce_bRItn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:22:1NG_SI:MPLE_ MinManote: x_u64in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here_2, n cclF 22 | DEFINE_ncclDevFunc(AlluncARllRedeuce,d FuuncMincMax,e ui_RING_SIMPLE_MinMax_u64n_t64_t4, NCC,L_ALG O_RnING, cNCCclFuL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62ncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROT: note: Oexpanded from macro 'DEFINE_ncclDevFunc' 611 | _ RSunWIorkBatMcPLE, 4h, ^algo, /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h: pr611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch().yrun();, \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:r670:15: enote: field 'nthreads' will be initialized after field 'tidInBlock' d670 | op, a l tid(tigd)o, proto, unr, ntohreadls(nthlrea>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: ds), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hfield 'nthreads' will be initialized after field 'tidInBlock' 670: | 670 tid(tid), nthreads(nthreads), tidInBlock:60: note: (tfield 'group' will be initialized after field 'stepSize' h670 | r etiad(tidd),I dnthxreads(.ntx), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIhredadsx), .tidIxnBl)ock,(th reagdIdxr.x), grooup(ugropup)(, g| ^~~~~~~~~~~ roup), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64_4, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthre/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64_4, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h: 670:15: /warning: initializer order does not match the declaration order [-Wreorder-ctor] *670 | D tid(tiid), rnthreeads(ntchreadts), =tidIn*Block/(threa0dIdx.,x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_S Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkCTEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreoll().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SeUIpDoMwn,4 CO_LL_4UNR,OLL >(tnid,c ntchreladsF, wourk)n; c| ^ A/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hl:432:78l: Rnote: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here e432duce, FuncMinMax, uint64_ | if (tid < subtn) RunWorkColl().t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), runn(titd, hsurbetn,a wodrk)s; (| ^ n/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:t17:1h: note: rin instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here e17 | aDEFIdNE_sncc)lDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64_4, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4, tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock)( | t^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hh:r611:62e: note: expanded from macro 'DEFINE_ncclDevFunc'a d611 | I dRunxWor.kBaxtch), palg(o, gprotrooup), | ^~~~~~~~~~~ , unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64_4, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64_4, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64_4, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthre/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), gr:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor]o 670 | u tid(tid),p nthreads((nthreads)g, tidInBlorck(threadoIdx.x), guroup(grp), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSioup), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~z | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | e stepSi(zestepSize_ == 0 ? ncclShmem.comm.b(stuepSize_ ==f 0 ? ncclfShmem.comSm.buffizes[NCCL_PROTSOizes[NCC_L_PROTO_SIMSIMPLE]/NCCL_STEPSPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tiroto, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl work(); | ) ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h.:432:78:r note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here u432 | n if( (tidt < suibtn) dRunWor,kColl (w).run(tid, suobtn, rwork)k; | ); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DE ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllRFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u64_4, ncclFuncAllReduce, FuncMinMax, uinted6uce_4RING__SIMPtLE,_M inMaNx_u6C4_4, CncclLFunc_AllRAeducLe, FuncMinGMaOx, ui_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] nt64R_t, NCICL_ANLGO 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSiz_GRING,, NC CNCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: enote: (stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64_4, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWoL_PrROTOk_SIMBPLE,a 4) t| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hc:611:h62: note: , algo, , redop, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x)p,rot o, ungrollr>().orun(u); \p | ^ (/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:g670:15: rnote: field 'nthreads' will be initialized after field 'tidInBlock' o670 | u tpid(t)id), ,nthr eads (nth| read ^~~~~~~~~~~~~~~~~s), tidI/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hnBlock(:thre670adId:x.x),60 gro:up( grounote: p), field 'group' will be initialized after field 'stepSize' | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h :670: 60: note: field 'group' will be initialized after field 'stepSize' 670670 | | t id(t tid(tid), nthreadid), nthreads(nthreads), tidInBlocks(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64_4, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nt/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u64_4, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ hreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64_4, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64_4, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u64_4, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, wor/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hk); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64_4, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunW:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmeormkBatch<.coll,c ty, roedop, algmo, pro.to, unbroll>(u).run(f); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:fSizes[NCCL_PROTO_SIMPLE]/NCC670:15:L note: field 'nthreads' will be initialized after field 'tidInBlock' _ 670 | S tTid(tEid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitivesnthr,eads (nth0reads,), t idInPBlocrk(thoreadtIdx.x), grouop(gro,up ), 0| ^~~~~~~~~~~ > prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u64_4, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u64_4, ncclFun/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hcAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidIn:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64_4, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Block(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u64_4, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u64_4, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 21 warnings generated when compiling for gfx942. 21 warnings generated when compiling for gfx90a. 1717 warnings generated when compiling for gfx1102. warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1102. 21 warnings generated when compiling for gfx942. [ 60%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp 21 warnings generated when compiling for gfx90a. [ 61%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_bf16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cppIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1,In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_groupIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ (); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | elId - work->channelLo; | ^~~ uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cppIn file included from :2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - woIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ rk->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ :366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from :366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARPIn file included from _SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_2, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_2, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_2, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_2, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_u8_2, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_2, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_2, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_u8_2, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_2, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthrea/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hds):,670 :t15i:d Iwarning: nBinitializer order does not match the declaration order [-Wreorder-ctor]l ock(threadIdx.x), gro u670p | ( g r o utpi)d,( t i| d ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~) , | n tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_t hreads(nthr e671a | d s ) , sttiedpISniBzleo(cskt(etphSriezaed_I d=x=. x0) ,? gnrcoculpS(hgmreomu.pc)o,m m .| b ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~u f f| S tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_i zes[NCCL_ P671R | O T O _ SsItMePpLSEi]z/eN(CsCtLe_pSSTiEzPeS_/ s=i=z e0o f?( Tn)c c:l SshtmeepmS.iczoem_m). b{ u f| f ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~S i z| e group(groups [NCCL_PROTO_SIMPLE]/NCCL_S/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hT:E254PS:/90s:i znote: ein instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested hereo f(T) : s t254e | p S i z e _ )P r{i m i| t ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~i v e| s group(group , FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested hereX _DEV_ARIT Y303, | 1> , /P*rDiimrietcitv=e*s/<0T,, PRreodtOop,, 0F>a npArsiymmsm e t| ^r ic<1, NCCL_M/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hA:X565_:D5E:V _note: Ain instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested hereR ITY>, / *565D | i r e c tr=u*n/T0r,e ePUrpoDtoow,n <0T>, pRreidmOsp , | P ^ rotoSim/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hp:l565e:<51:, note: 1in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here, COLL_UN R565O | L L > , rCuOnLTLr_eUeNURpODLoLw>n(note: ,in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here COLL_UNR OL432L | > ( t i d , inft h(rteida d, 0, 2, 2>::run' requested hereO p, Algo, 432P | r o t o , CiOfL L(_tUiNdR Ou(b)t.nr)u nR(utniWdo,r ksCuobltln<,F nw,o rTk,) ;R e d| O ^p , Algo, /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cppP:r7o:t1o:, note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested hereC OLL_UNROLL >7( | )D.ErFuInN(Et_indc,c lsDuebvtFnu,n cw(oArlkl)R;e d u| c ^e _TREE_SI/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cppM:P7L:E1_:M inote: nin instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested hereM ax_u8_2, n c7c | lDFEuFnIcNAEl_lnRcecdluDceev,F uFnucn(cAMlilnRMeadxu,c eu_iTnRtE8E__tS,I MNPCLCEL__MAiLnGMOa_xT_RuE8_E2,, NnCcCcLl_FPRuOnTcOA_llSRIeMdPuLcEe,, 2F)u n| c^M inMax,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h :u611i:n62t:8 _note: texpanded from macro 'DEFINE_ncclDevFunc', NCCL_ A611L | G O _ T RREuEn,W oNrCkCBLa_tPcRhO, al/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hgo:,611 :p62r:o note: expanded from macro 'DEFINE_ncclDevFunc't 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ o, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_2, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_u8_2, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_2, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_2, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_2, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_2, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_u8_2, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u8_2, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_u8_2, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_2, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_2, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_2, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_u8_2, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u8_2, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u8_2, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_2, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_2, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_2, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ dx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_2, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_bf16_2, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_2, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_2, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_bf16_2, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_2, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: In file included from initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u8_2, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_bf16_2, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_4, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_2, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_2, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u8_2, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_2, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u8_2, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u8_2, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTIn file included from O_LL/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: 1In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:211: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h8:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15:] warning: initializer order does not match the declaration order [-Wreorder-ctor] /670 | NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_u8_2, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_4, ncc | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_2, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_2, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ lFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_2, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nth:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | , nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_4, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.croeadms), timdInBlo.ck(thrbeadIdx.xu), groufp(groupf), S | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ izes[NCCL_PROT | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(TO/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_2, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRin) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_4, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ g, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthre_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorx), group(group), | ^~~~~~~~~~~ kColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u8_2, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u8_2, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_bf16_2, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_2, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_bf16_2, ncclFuncAllReduce, Fun 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_4, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ cPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u8_2, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_2, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_u8_2, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, ProtoIn file included from , 0/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp>: 2p: rIn file included from i/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hm:s11 : | In file included from ^/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h :175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h::29565:: 5warning: :field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | ru n496T | r e e Up Dtoiwdn(I,Z CEO)L, Lw_aUrNpR(OtLLi>d(/WtAiRdP,_ SnItZhEre)a,d s| , ~~~~~~~~~~~~~~~~~~ w o| r stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)k ); | ^ 497 | war/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hp:I432nB:l78:o cnote: kin instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here( threadId x432 | . x / W A RP _ifS I(ZEt)id, < | s ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~u b | t warp(tid/WARP_SIZEn ) RunW o498r | k C o l lf| ( ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~) . r| warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3u n(tid, su499b | t n , wsotrekp)S;i z e| ( ^n cclShmem./builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cppc:o7m:m1.:b unote: fin instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested heref Sizes[NCCL _7P | RDOETFINE_ncclDevFunc(AllReduce_TREEO_SIMPLE_PreMulSum_bf16_2, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ _LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_bf16_2, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_2, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_2, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ eads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_2, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthread:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_4, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ s(nthreads), In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReductidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_4, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ e_RING_SIMPLE_MinMax_u8_2, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_2, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_4, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u8_4, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_4, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf16_2, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_4, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf16_2, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_4, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf16_2, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_2, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_2, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_4, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_4, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUp tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Down, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_4, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf16_2, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_4, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf16_2, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_2, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf16_2, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u8_4, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_2, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_4, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_4, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u8_4, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_bf16_2, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_4, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_4, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf16_2, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_4, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u8_4, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_4, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_4, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u8_4, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u8_4, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h :670:15: warning: 432initializer order does not match the declaration order [-Wreorder-ctor] | if (tid < s670u | b t n ) tRiudn(Wtoirdk)C,o lnltx()),. rgurno(utpi(dg,r osuupb)t,n , | w ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~o r k| ) tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_; | ^ 671 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp : 12 : 1s:t enote: pin instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested hereS ize(stepS i12z | eD_E F=I=N E0_ n?c cnlcDcelvSFhumnecm(.AclolmRme.dbuucfef_SRiIzNeGs_[SNICMCPLL_EP_RPOrTeOM_uSlISMuPmL_Eb]f/1N6C_C2L,_ SnTcEcPlSF/usniczAelolfR(eTd)u c:e ,s tFeupnSciPzree_M)u l{S u m| , ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ h i| p group(group_ bfloat16, NCCL/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h_:A254L:G90O:_ Rnote: Iin instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested hereN G, NCCL _254P | R O T O _ S IPMrPiLmEi,t i2v)e s <| T^, RedO/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hp:,611 :F62a:n Anote: sexpanded from macro 'DEFINE_ncclDevFunc'y mmetr i611c | < N C C LR_uMnAWXo_rDkEBVa_tAcRhI ,t y/,* Drierdeocpt<=t*y/>0,, aPlrgoot,o ,p r0o>t op,r iumnsr o l| l ^> ().run/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h(:)565;: 5\: note: | in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h: 670565: | 15 : note: field 'nthreads' will be initialized after field 'tidInBlock'r unTree U670p | D o w n (,t hCrOeLaLd_IUdNxR.OxL)L,> (gtriodu,p (ngtrhoruepa)d,s , | w ^~~~~~~~~~~~~~~~~o rk)/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h;: 670 :| 60 ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkCo: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ll().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_4, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_2, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_4, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_2, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u8_4, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadId/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPL/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_4, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ E/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h_:Pr611e:M62u:l Snote: uexpanded from macro 'DEFINE_ncclDevFunc'm _bf16_4 ,611 | n c c l FRuunncWAolrlkRBeadtucche<,c oFluln,c Ptrye,M urleSduomp,< thyi>p,_ bafllgooa,t 1p6r,o tNoC,C Lu_nArLoGlOl_>T(R)E.Er,u nN(C)C;L _\P R | O ^T O_SIMPLE,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h :4)670: 15 :| ^ note: field 'nthreads' will be initialized after field 'tidInBlock' /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: 670expanded from macro 'DEFINE_ncclDevFunc' | tid (611t | i d ) , RnutnhWroerakdBsa(tncthht,h raelagdoI,d xp.rxo)t,o ,g ruonurpo(lglr>o(u)p.)r,u n (| ) ^~~~~~~~~~~~~~~~~ ; \ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h :| 670 ^: 60: note: field 'group' will be initialized after field 'stepSize' /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: 670 | field 'nthreads' will be initialized after field 'tidInBlock' tid( t670i | d ) , nttihdr(etaidds)(,n tnhtrheraedasd)s,( nttihdrIenaBdlso)c,k (ttihdrIenaBdlIodcxk.(xt)h,r egardoIudpx(.gxr)o,u pg)r,o u | p ^~~~~~~~~~~( group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ CL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_4, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u8_4, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_4, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_4, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_4, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8_4, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_bf16_2, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_4, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h::670432::1578:: warning: note: initializer order does not match the declaration order [-Wreorder-ctor]in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | i f670 | ( t i d tu(p)(.grruonu(pt)i,d , | s ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~u b t| n tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_, work); | 671 ^ | stepS/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cppi:z22e:1(:s tnote: ein instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested herep Size_ == 0 ?22 | DnEcFcIlNSEh_mnecmc.lcDoemvmF.ubnucf(fASlilzReesdu[cNeC_CRLI_NPGR_OSTIOM_PSLIEM_PPLrEe]M/uNlCSCuL_mS_bTfE1P6S_/4s,i znecocfl(FTu)n c:A lsltReepdSuicez,e _F)u n{c P r| e ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~M u l| S group(group um, hip_bfloat1/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h6:,303 :N90C:C Lnote: _in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested hereA LGO_RING ,303 | N C C L _ P RPOrTiOm_iStIiMvPeLsE<,T 4,) R e| d^O p, FanA/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hs:y611m:m62e:t rnote: iexpanded from macro 'DEFINE_ncclDevFunc'c <1, NCCL _611M | A X _ D ERVu_nAWRoIrTkYB>,a t/c*hDi>, parligmos, p| r ^o to, un/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hr:o565l:l5>:( )note: .in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested herer un(); \ 565 | | ^ runTr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.he:e670U:p15D:o wnote: nfield 'nthreads' will be initialized after field 'tidInBlock'< T, RedO p,670 | P r ot otiSdi(mtpilde)<,1 ,n t1h,r eCaOdLsL(_nUtNhRrOeLaLds>),, CtOiLdLI_nUBNlRoOcLkL(>t(htrieda,d Indxt.hxr)e,a dgsr,o uwpo(rgkr)o;u p )| , ^ | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h::60432:: 78note: :field 'group' will be initialized after field 'stepSize' note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 670 | 432 | t i d ( t i di)f, (nttihdr ea().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_4, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf16_2, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u8_4, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf16_2, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf16_4, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u8_4, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_4, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.htid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_4, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_4, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf16_2, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_4, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u8_4, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf16_4, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf16_4, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_4, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf16_4, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_4, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf16_4, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf16_4, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_4, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_4, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_4, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_4, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf16_4, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf16_4, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16_4, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf16_4, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf16_4, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1200. 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx942. [ 61%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_bf8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 17 warnings generated when compiling for gfx1030. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 17 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cppIn file included from :2 | ^ : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cppIn file included from :/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1111: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_groupIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ (); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable]In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_g/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ rIn file included from oup(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - wIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ ork->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from :145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barriieer_rby__grobup(y); _| ^~~~~~~~~~~~~~~~~~ g/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29r:15:o note: expanded from macro 'barrier_by_group'u p29 | ( c)ons;t int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | cons| t ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h :29:i15: nnote: expanded from macro 'barrier_by_group' t 29 | b cionsdt i nt =w = thnrIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t daeacdIdx.x/WARcP_SlIZES; \h | m ^ em.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from ta1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uiIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:nt32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->chann/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const iIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ nt w = threadIdx.x/WARP_SIZE; \ | ^ elLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - wo/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ r/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15:k warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ ->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ e(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(thr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreadIn file included from s)/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp,: 2t: iIn file included from d/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hI:n11B: lIn file included from o/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hc:k175(: t/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.hh:r498e:adIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NeCaCdLI_dSxT.ExP)S,/ sgirzoeuopf((gurionutp6)4,_ t )| ) ^~~~~~~~~~~~~~~~~ { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h::670421::609:: note: note: field 'group' will be initialized after field 'stepSize'in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | 670 | tpirdi(mtsi(dt)i,d ,n tnhtrheraedasd(sn,t htrreeaed-s>)d,o wtni,d ItnrBeleo-c>kd(otwhnr,e awdoIrdkx-.>xs)e,n dgbruofufp,( gwroorukp-)>,r e c| v ^~~~~~~~~~~b uff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ .x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreaIn file included from d/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from s/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ (nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_4, ncclFuncAllReduce/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto ,670 | u n r o ltli>d(()t.irdu)n,( )n;t h\ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ reads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_nc:670:15:clDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group):670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ atch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ p, Proto, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 21 warnings generated when compiling for gfx90a. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 21 warnings generated when compiling for gfx942. [ 61%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f16.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ 2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:In file included from 27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cppIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ :2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h::145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncPreMulSum, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncPreMulSum, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncPreMulSum, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTrePLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncPreMulSum, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ eUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncPreMulSum, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncPreMulSum, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TR/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ EE_LL128_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_4, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().r(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ un(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/si:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ zeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_4, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_4, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ SIMPLE_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tIn file included from id < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16_4, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_4, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ _SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_4, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_4, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_4, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_4, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_4, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_4, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16_2, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_4, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16_4, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16_4, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_4, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_4, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_4, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_4, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16_4, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_4, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_4, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_4, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16_4, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_4, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_4, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16_4, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16_4, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid)^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_4, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16_4, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16_4, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16_4, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16_4, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16_4, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx908. 21 warnings generated when compiling for gfx942. 21 warnings generated when compiling for gfx90a. [ 61%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f32.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp 21 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, daIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ ta2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: :15: unused variable 'data2' [-Wunused-variable]note: expanded from macro 'barrier_by_group' 29 | co nst int w = t145hreadId | x.x/WAR P_SIZE; \ | ^ In file included from uint32_t data1, flag1, data/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelIdIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5In file included from : warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h const int w = threadIdx.x/WARP_SIZE; \ | ^ :366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_gro/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ up(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.chIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h | ^ :366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ annelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28::366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrie:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ r_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2;/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int expanded from macro 'barrier_by_group'b 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ id = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t daIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ ta1, flag1/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ , data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32_2, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32_2, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32_2, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unrdoop, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.com:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32_2, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611Algo, Promt.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32_2, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ o, COLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32_2, ncclFuncAllReduce, FuncPreMulSum, :62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32_2, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here In file included from 565/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), | n trunTreeUhreads(nthreads), tidInBpDolwn,I COLdL_UNxROLL.>(tixd, nt)hr,ead s, wogrk);r | ^o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hup(group), : 432:78: | note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | st if (tid < subtn) RunWorkColl().| run(ti group(groupd, sub tn, wo/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hrk); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | D:EFINE254_nc:clDevF90unc(Al: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32_2, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ oat, NCCL_ALGO_TREE, NCCL_DEV_ARITY, 1>, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_PROTUO_SIMPNLE, 2)R | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hO:611:62:L note: expanded from macro 'DEFINE_ncclDevFunc' 611L | >(tid, nthreads, work); | ^ Run/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hWorkBatch<:coll432, ty:, re78dop<:ty>, algnote: o, pin instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested hereroto , un roll>()432.run | (); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads (if (tnidthre ().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEx),F groIup(gNroupE), _| ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hncclDevF:u670:60:n note: field 'group' will be initialized after field 'stepSize' c 670 | ( tAid(tlid),l nthReduce_TREE_readSs(ntIhreaMds),P tLidInEBloc_k(thPreMulSum_fre3adId2x.x)_, gr2oup(g,roup), | ^~~~~~~~~~~ ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32_2, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32_2, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f32_2, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | | tid(tid) , nthr eads(nt hreadsr), tidIunBlockn(threaRdIdx.x/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32_2, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' )i, grounp(groupg),< | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~T | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ , 671 RedOp, ProtoOLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32_2, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , COLL_UNROLL>(tid, nthreads, wo | r stepSkize(st)epSize_; == 0 ? nccl Shmem| .comm. ^buffSi zes[NC/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hCL_PR:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | O TO_SIMiPLE]/NfCCL_ST EPS/s(izeof(T) tid < subtn) RunWorkColl, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303L | LPrimit_ivesUNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:12:1, 1, 2, 2>::run' requested hereic<1, NCCL_M AX_DEV_AR12ITY>, | In file included from DEFINE_ncclD/e*Dir/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32_2, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCecvt=*/0, FPrunot/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cppc:2: (AllRo, 0e> prdIn file included from iuce_RING_SIMPLE_Prmes | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here M/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h: 11: In file included from u/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:l565498:29: S | warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] u 496 | m tid(_ tid f)32_2, ncclrunTreeUpDown, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ARllPReduc_e, FSuncPreIMulSumZ, floaEt, NCC)dOp, ProtoSimple<1, 1, COLL_UNROLL>, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:L432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32_2, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ _ALGO_RING, NCCL_PROTO_SIMPLE, , 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | | R ~~~~~~~~~~~~~~~~~~ u | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)n 497 | warpWInBloock(thrreadkIdx.Bx/WAaRP_StIZE)c, | h ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ <| warp(tid/WARP_SIZE coll, ty, redop ,flag Threaad((ltid%g4)=o, proto, unroll>().=r3),u grounp(gro(up),) | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~; | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h stepSize(ncclShmem.comm.buffSizes[NCCL_PRO:670:15:T note: field 'nthreads' will be initialized after field 'tidInBlock' O 670 | _ tLiLd(t1id),2 nt8hreads(nthreads), tidInBlock(threadIdx]/.NCCLx_ST)EP, group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60S/s:iz eofnote: (uinfield 'group' will be initialized after field 'stepSize't64 _t )) { 670| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h : 421:9 : note: tin instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here i421 | d ( t priid), nthreads(nthreads), tidInBlock(threamsd(tiId, dnthxreads, tree.->dxown), t,ree- >dogwn,r woork-u>psen(dbufgf, rwoupork->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | ), | ^~~~~~~~~~~ runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f32_2, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f32_2, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlocIn file included from k(threadIdx.x/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:)2, group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthrea: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hd:11: sIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:(175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.hn:498:29t: warning: hfield 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] r496 | e a tidd(tisd), nthreads(nthreads), wid(tid%WARP_SIZE), warp), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f32_2, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f32_2, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, //builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] *Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COL 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f32_2, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ L_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32_2, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f32_2, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ op, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32_2, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthre/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hads(nthr:670:15e: warning: initializer order does not match the declaration order [-Wreorder-ctor]a 670d | stid()tid),, nt thidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: rfield 'group' will be initialized after field 'stepSize'eads(nthread s), tidIn670Blo | ck(t hrea dIdx .x), groutp(grioup)d, | ( ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ tid)=, nt=hrea 0 ? ncclShmds(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ em.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f32_2, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32_4, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitive/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hs, 0, warning: Pinitializer order does not match the declaration order [-Wreorder-ctor]ro to, 0> prim670s | | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthr e tiad(tdid)s, nt,hre adsw(ntohrk); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.coomrkCmoll.().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f32_2, ncclFuncAllReduce, FuncPreMulSu: stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /m,* flDoati, NrCCLe_ALcGO_RING,t NC=CL_*PRO/TO_0SI,MPL E, Proto, 0> 2) p | ^r /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hi:611:ms | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h62: note: expanded from macro 'DEFINE_ncclDevFunc' :611565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDow | n , algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tieddOp,( tProitoSdimpl)e<1,, 1 , CnOLtL_UhNROrLL>e, aCOLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | ds (nt hre adsi), tfidI nBl(ockt(thiread < subtn) dRIdxu.x)n, Wgrooup(rgrokupColl().run(ti), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ d, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32_4, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group)In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h, | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670::175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f32_2, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ 60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f32_2, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32_4, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f32_2, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x),In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32_2, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(thre/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670 : 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f32_2, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid)adIdx.x),, group( group), n | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ t671 | sthepSize(srtepSize_ e== 0 ? nacclShmemd.comm.bufsfSizes[NC(CL_PROTOn_SIMPLE]/NtCCL_STEPShreads), tidInBlo/sizeof(cT) : stke(pSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | PrimthreadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_)it ives{, 0 ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~, Proto, 0> prim s | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h| group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:558::5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 90 558 | : runRi ng, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested hereto, COLL_ UNROLL>( tid, nth303 | reads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if ( Primitives, /*Direct=*/0, Prtid p, Al go, Prpotorims | ^ ,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h COLL_UNRO:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565LL>() | .run (tid , runTreeUpDown, 1, 2, 2>::run' requested here 112 | DEF,INE_nc clDCOLL_UNROLL>, COLevFunc(AllReduce_RING_SIMPLE_PreMulSum_f32_2, ncclFuncAllReducL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32_4, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | e, FuncPreMulSum, fl RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ oat, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PRO/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32_4, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ TO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32_2, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x)/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | , g roup(g roup)s, | ^~~~~~~~~~~~~~~~~ t/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:e60: note: field 'group' will be initialized after field 'stepSize' p 670 | S tidi(tid),z nthreeads(n(threadss), titdInBloeck(threpadIdx.Sx), grioup(grzoup), e | ^~~~~~~~~~~ _ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32_4, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthrea/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32_4, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREEup), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSiz/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.e(stepSize_ == 0 ? ncclShme, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tibuffSid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ zes[NCCL_PROTO_SIMPLE>, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if]/NCCL_STEPS/size (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32_4, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ of(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32_4, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ symmetric, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hTREE_SIMPLE_Pre/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hMulSum_f32_4, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>(:)670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor]. 670 | r tidu(tid),n nthrea(ds(nth)reads),; tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffS:670:i15: warning: zinitializer order does not match the declaration order [-Wreorder-ctor] 670e | tsid(tid)[, nthNreads(nCthreadCs), tidLInB_lock(thPreadIdRx.x), gOroup(gTroup),O | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ _ \ | S ^ | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:I670 tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_:15: Mnote: field 'nthreads' will be initialized after field 'tidInBlock' P 670 | L tid(tE671id), ] | nthre/a ds(nNth readC s), tC idInBLsl_STEPS/tepSize(stepSize_ == 0 ? ncclShockm(thereadmIdx..x), group(gcrooup),m | ^~~~~~~~~~~~~~~~~m /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:.670:60:b note: field 'group' will be initialized after field 'stepSize' u 670 | f tfid(tSid)izes[NCCL_PROTO_SIMPLE]/NC, nthreads(nthreads), tidInBlock(threadIdx.x), group(gsizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /CL_S*TEPDS/siizeofr(T) e: stecpSizte_) {= | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~* | group(group/ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h0:63:,56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | PrimitivesrPoup prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runT RedOp, FanSymmetric<1>, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, reeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl, 1, 2, 4>::run' requested here C 432 | if (tid < subtn) RunWorkColl(O).LrL>(un(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_).run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32_4, ncclFuncAllReduce, FuncRPINGr_SeIMMPLuE_lPrSeMuulmSu, m_ff3l2_o4,a ntcc,lF unNcAlClCReLduc_e,A FLunGcPOre_MuTlSRumE, Efl,oa t,N NCCCCL_LAL_GOP_RRINOG,T NOCCL__PSROITOM_SPIMLPLEE,, 4 ) 4 | )^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: | ^note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), gr>(o).urupn(();g \r o| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hu:p670:)15:, note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), ti| ^~~~~~~~~~~~~~~~~d /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hI:670:60n: Bnote: field 'group' will be initialized after field 'stepSize'l 670 | o c kti(d(ttihd)r, entahrdeaIdsd(nxth.rexad)s), tidInBlock(threadIdx.x), ,g grrooupu(gpro(up), g roup), | ^~~~~~~~~~~ | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32_4, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f32_4, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32_2, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32_4, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE,| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_f32_2, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMu/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f32_4, ncclFlSum_f32_4, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroluncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ l>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32_4, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclS Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32_4, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ hmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>In file included from (tid, nthreads, /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f32_2, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32_4, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32_4, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f32_4, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f32_4, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWor(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, PrkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_f32_2, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ oto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f32_4, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f32_4, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | Ptroto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f32_4, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ id(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), ti/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f32_4, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ cclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f32_2, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32_4, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32_4, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32_4, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f32_4, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32_4, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f32_4, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 21 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx1200. 21 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx906. 21 warnings generated when compiling for gfx942. [ 62%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f64.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1102. [ 62%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.head, mantissa; | ^ :14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ , flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_grIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ oup(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = thre:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ adIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | In file included from const int bi | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ d = ncclShmem.channelId - work->channelLo; | ^~~ :218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int :366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flagIn file included from 1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, d/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ ata2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShm/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ em.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flaIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h::670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, CO11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ g1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ LL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ :218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ :366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp::11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from :498:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: 29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunW ProotoSimple<1, 1, COLL_UNROLL>, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ rkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hIn file included from :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threIn file included from adIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h: 11671 | : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.hstepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | :145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ 254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid)/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STE, nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hPS/sizIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_grou:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | p(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = const int threadIdx.x/WARP_SIZE; \ | ^ In file included from eof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 027:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_grou:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_Pp(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = tROTO_SIMhreadIdx.x/WARP_SIZE; \ | ^ PLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, workIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_4, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(grouIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group()_t data1, flag1, data2, flag2; | ^~~~~ p), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ ; | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = t/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, pIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ hreadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] roto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:67015: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | | tid(t id), nthrea ds(nthreads ), tidInBl ock(threatdIdx.x), igroup(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ d(tid), nthreads(nthreads), tidInBlock(thr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ eadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_4, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = nc.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ clShmem.channelId - work->channelLo; | ^~~ (tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_4, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_4, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_4, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_4, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64_4, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | ste/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tIn file included from pSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56id(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ : note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_4, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_4, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_4, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64_4, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64_2, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_4, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64_4, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ?/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ /NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_4, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_4, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64_4, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_4, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_4, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_4, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_4, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_4, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_4, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_4, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64_4, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_4, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64_4, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_4, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64_4, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | P), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ rimitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64_4, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64_4, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64_4, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64_4, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64_4, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nt/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSihreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ze_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), gIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads)roup(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_n cclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ .buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor]:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid( tid), nthreads(nthreads)496 | tid(tid), nthreads(nthrea,d tidInBlocks(threadIdx).x), grou, wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ p(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(gr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ oup), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ _SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buff/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreadsS(izes[NCCL_PnROthreaTOds), tidInBlock(threadIdx.x), grou_pL(Lg1r2o8u]p/)N,C C | L ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~_ S T| E tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_P S/sizeof(uin t6716 | 4 _ t ) )s t{e p S| i ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~z e (| s group(groupt epSize_ == 0 ? ncclShmem./builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hc:o63m:m56.:b unote: fin instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested heref Sizes[NCC L63_ | P R O T OP_rSiImMiPtLiEv]es/Ne,p S0i,z eP_r)o t{o , | 0 ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~> p| r group(groupi ms | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: 1062note: | in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here runRin g254< | T , R e d OPpr,i mPirtoitvoeLsL<1T,2 8R,e dCOOpL,L _FUaNnRAOsLyLm>m(ettirdi,c , /*Dire/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hc:t432=:*78/:0 ,note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested hereP roto, 0> 432p | r i ms | ^if (tid , ProtoSimple<1, 1, 4>, 4>' requested hereR unWorkC o565ll | < F n , rTu,n TRreedeOUp,p DAolwgon,< TP,r oRteod,O pC,O LPLr_oUtNoRSOiLmLp>l(e)<1.,r u1n,( tCiOdL,L _sUuNbRtOnL,L >w,o rCkO)L;L _ U| N ^R OLL>(tid/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp,: 10:n1t:h rnote: ein instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested herea ds, work); 10| | ^D EFINE_ncclDe/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hv:F432u:n78c:( Anote: lin instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested herel Reduce_R I432N | G _ L L1 2 8i_fP r(etMiudl SL(_)A.LrGuOn_(RtIiNdG,, sNuCbCtLn_,P RwOoTrOk_)L;L 1 2| 8 ^, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:17:1/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:: 611note: :in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here62 : note: expanded from macro 'DEFINE_ncclDevFunc' 17 | D E611F | I N E _ nRcuclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STE/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ 432= | = 0 ? nicfc l(Sthimde e(p)S.irzuen_()t i{d , | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~s u b| t group(groupn , work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp::6317::561:: note: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested herein instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 63 | 17P | rDiEmFiItNiEv_enscS,I M0P,L EP_rPorteoM,u l0S>u mp_rfi8m_s4 , | n ^c clFunc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hA:l558l:R5e:d unote: cin instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested heree , Func P558r | e M u l Sruumn,R irncgc_(PtRiOdT,O _nStIhMrPeLaEd,s ,4 )w o r| k^) ; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hnote: :expanded from macro 'DEFINE_ncclDevFunc'432 :78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 611 | R u432n | W o r k B a ticfh <(ctoildl ,< tsyu,b trne)d oRpur,k Caollglo<,F np,r oTt,o ,R eudnOropl,l >A(l)g.or,u nP(r)o;t o\, C| O ^L L_UNROLL>().r/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hu:n670(:t15i: dnote: , field 'nthreads' will be initialized after field 'tidInBlock's ubtn, wo r670k | ) ; | ^t id(tid), n/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cppt:h22r:e1a:d snote: (in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested heren threads), t i22d | IDnEBFlIoNcEk_(ntchclrDeeavdFIudnxc.(xA)l,l Rgerdouucpe(_group), | ^~~~~~~~~~~~~~~~~ R/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ING_SIMPLE_PreMulSum_f8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Size_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f8_2, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' , 1, COLL_UNROLL>, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCC tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ L_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ eads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffS/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(izes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ AllReduce_RING_SIMPLE_PreMulSum_f8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f8_4, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx906. 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx942. [ 62%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u32.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx 29 | const int w .= threadIdxx.x/WARP_/SWAIZREP_SIZE; \ | ^; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hIn file included from In file included from :11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SI/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from Z/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174E: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7:; warning: unused variable 'w' [-Wunused-variable] 75 | \barrier_ by_gro up();| | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h: ^29:15: note: expanded from macro 'barrier_by_group' 29 | In file included from const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp | :2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h :11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h :174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145 :14: warning: unused variable 'data1' [-Wunused-variable] 145 | u uiint32_tnt32_t data1, flag1, d dataa1, fltag1, daata2, 2flag2;, | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h :145:21:f warning: unused variable 'flag1' [-Wunused-variable] 145 | lag2; | ^~~~~ uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145; | | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h :145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uiunt32_it danta1, ftlag1,3 data22, fl_ag2;t d | ^~~~~ata1, flag 1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int In file included from In file included from bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: =In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h :80:5:t warning: unused variable 'w' [-Wunused-variable] h80 | r barreier_by_grouap(); d| ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hI:29:15: dnote: expanded from macro 'barrier_by_group' x29 | .constx int /w :=366W:15 : warning: Aunused variable 'bid' [-Wunused-variable]t R366h | P r c_onsetS inIat bdZE;Idixd = n\.cclx Shmem | ^ /WARP_SIZE; \ | ^ .channelId - work->channelLo; | ^~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable]/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelI 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ d - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - :218:15:w warning: unused variable 'bid' [-Wunused-variable] o218 | r conkst int -bid => ncclcShhanmem.nchanneellId - Lwork-o; | ^~~ >channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | c/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.honst int bid = nc:366:15c: warning: unused variable 'bid' [-Wunused-variable] l 366 | S hconstm int ebid = mn.channelId - work->channelLo; | ^~~cclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threaIn file included from dIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); 29 | | cons ^~~~~~~~~~~~~~~~~~t int w = thre/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hadIdx.x/W:ARP_SIZE29; \ :| 15: note: ^ expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2ZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | ui: nIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174t: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: 3unused variable 'data1' [-Wunused-variable] 145 | 2 uint32__t data1,t flag1, data2, fdlag2; a | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:t145:21: warning: unused variable 'flag1' [-Wunused-variable]a1, 145 | flag1, udinata2, flagt32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1,2 data2,; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp::218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ 2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->chanIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ nelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] In file included from 145 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | bar uint32_t data1, flag1, data2, flag2; | ^~~~~ rier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem./builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:145:28::218: 15: warning: unused variable 'bid' [-Wunused-variable] warning: 218 | unused variable 'data2' [-Wunused-variable] 145 | const inut bidin =t32_t data1, f nccllShmema.channg1, delId - woatrk->channelLo; | ^~~ a2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->chanIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:nelLo; | ^~~ 173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | In file included from tid(tid), nthreads(nthre/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from a/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | d s), tidI nBlock(stepSithrezadIdx.x), geroup(gr(oup), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ s | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | t stepepSize_ == 0 ? ncclShmem.Sicze(steopSize_mm.buffSizes[NCCL_ ==P 0 ? nRcclShmeOm.commT.buffSOizes[N_CCL_PSROTOI_SIMPLME]/NCCPL_STEPLS/sizeEof(T) :] stepS/ize_) N{CCL_ | S ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ TEP | group(group S/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/siz:eof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here c 254 | < PrNimitiveCs, /*DEirect=V*/0, Pr_otoARITY, 1>, /*Direct=*/0, Proto, 0> ,prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h0:565:5:> note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | rpunTrims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565ree | UpDown , COLL_UNROLL>(tROLLi>, COLdL_UNROL,L>(ti d, nthreads, workn); | ^t /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432h:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested herer 432e | ads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if ( if (ttid < isubdtn) Ru nWorkC().Op, Algo, Proto, run(tCid, suObtn, worLk)L;_UNROLL>().ru | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here n(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_n7c | DEFINcE_ncclDlevFuDnc(AllReeduce_TvREE_SIFMPunc(AllReduce_TREE_SIMPLE_PLreMEulS_um_Pu32_r2, encMcluFunlcAlSlReduucem, F_uncuPre3MulS2um,_ ui2n, ncclFuncAllReduce, FuncPreMut32l_t,S NCuCL_AmLGO,_TR EE,u NCiCL_nPROTtO_S3I2MPL_E, t2) , NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch re,dop , allgog, o,pro to,p unrrolol>()t.ruon(),; \ | u ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hn:r670:15:o note: field 'nthreads' will be initialized after field 'tidInBlock'l l670 | > (tid)(ti.d)run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(,t nthhreards(enthareadds)I, tdidIxnBl.ockx(th)rea,dId x.xg), rgrooup(ugpro(up),g | r ^~~~~~~~~~~~~~~~~ o/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:u670:60p: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), ntthrieadds),I tindInBBloclk(tohrceadkIdx(.x),t grhoupr(greoup), | a ^~~~~~~~~~~ dIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32_2, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32_2, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32_2, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32_2, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32_2, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u32_2, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u32_2, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_S/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u32_2, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ mem.comm.buffSizes[NCCL_PROTO_SITEPS/sizMeof(T) :P stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ =*D= 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32_2, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ irect=*/0, Proto, 0> priLE]/NCmCL_STEPsS/sizeo f(T) : stepSiz| e_) { ^| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | : Prim565itives:, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTX_DEV_ARITY, 1>, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | reeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | ru nTreeUpDiown,t COLL_iUd < subtn) RunWorkColl,(tid, n threadTs, work,); | RedOp, Algo, Proto, COLL_UNRO ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hL:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested hereL 432 | > i(f (tid < subtn) RunWorkColl, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32_2, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCRLOLL>_().rPun(tRid, OsuTbtn,O work_); S| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cppI:7M:1: Pnote: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here L7 | DEEFINE,_ncc lDev2Func)(All Red uce_| TREE_SIMPLE_PreMulSum_u32_2, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMP^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group)LE, ,2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h| : ^~~~~~~~~~~~~~~~~611:62 : note: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hexpanded from macro 'DEFINE_ncclDevFunc' 611: | 670 R:unW60ork:Bat ch, algo, proto, unroll>().run(); \ | In file included from ^/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32_2, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlocknote: field 'group' will be initialized after field 'stepSize' ( 670t | h trid(teid)a, ndthreIadsd(ntxhre.adsx),) ti,d group(grouInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ p )| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32_2, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32_4, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), ti:670:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_u32_2, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ 15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 dInB?lock(thre adIdx.x)n, groupc(group), c | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_l 671 | S stepSizeh(stepSizme_ == 0 em.comm.buffSiz? nes[NCcCclShmem.Lcomm.buf_fSiPRzeOTO_SIMPLE]/NCs[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | CL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | Pri ^mitives , ProtoSimple<1, 1, 4>, 4>' requested here CL_MAX_DEV_ARITY, 1>, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWor>, COkLL_UNCROLL>(otid, lnthrelads, , 0, 2, 2>::run' requested here 432T | , RedOp, Algo, Proto, CO if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_nccLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_ulD3evFu2nc(_AllR4e,duce_ TREEn_SIMcPLE_cPreMlulSuFm_u32u_2ncAllReduce, FuncPreMulS, nucclFmuncAl,lRed uce,u Funicnt32_t, NCCL_ALGO_TREE, NCCL_PPreRMuOlSTumO, _uiSntI32M_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2P)LE , 4| ) ^ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62:: 611note: expanded from macro 'DEFINE_ncclDevFunc': 62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | R611 | u n RWunoWorrkkBaBtcah, algo, proto, unrollty>>,( a)lgo.,r puronto(, )un;ro ll\> () .r| un ^() ; /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | t\i d| ( ^t /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hi:d670:)15:, note: field 'nthreads' will be initialized after field 'tidInBlock' n t670 | h r teida(tdids(),n threads), tidInBlock(threadIdx.x), group(nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: grfield 'group' will be initialized after field 'stepSize'ou p ), 670| ^~~~~~~~~~~~~~~~~ | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h :670 :60 : tnote: field 'group' will be initialized after field 'stepSize'i d670( | t itidd()ti,d) , nntthrheardse(nathdreasds(),nthreads )tidInBlock(t, htireadIddIxnB.loxck()th,re adgroupI(dxg.xr), goup), | ^~~~~~~~~~~ roup(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_u32_2, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32_2, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32_2, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmeIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tim.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=d%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThre*/0, aProto, d0> prims ( | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:(565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here t565 | riunTreeUpd%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmemDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) Ru.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | nW orkCo ll(().run(tid, nthreads, tree->down, treet-id,> subdtn,o wwork)n; , | ^w /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cppo:7r:1:k->sendbuff, work->recvbuff, work->red note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32_2, ncclFuncAllReduce, FOpArg); In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_u32_2, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplituin(t32t_t,i NCdCL,_AL GO_nTREtE,hreads, work); | ^ NCCL_PRO/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hTO_:SIM432PLE:, 278) : note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432| | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h :611: 62: if (tid < subtn) Rnote: expanded from macro 'DEFINE_ncclDevFunc' u611n | W o RurnWokrkBCatcoh, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' o670t | o, COL L_U NRO LL>t().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:5:1id:(ti note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllRd), enthdreadus(ncthreead_s),T tiRdInEBlock(threEadIdx.x)_, grLoupL(gr1oup2), 8 | ^~~~~~~~~~~~~~~~~_ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:P670reMulSum_u32_2,:60 : note: nfield 'group' will be initialized after field 'stepSize' c670c | l FuncAllReduce, FuncPreM utidl(tidS), untmhre,ads (ntuhrineadts),32_t, NCCL_ tAidILnBlGock(threadIdx.x), group(group)O,_TR EE, NC| CL_ ^~~~~~~~~~~PRO TO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32_4, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h().run:670:15: warning: (tinitializer order does not match the declaration order [-Wreorder-ctor]id, sub t670 | tid(tid), nthn, wrork)e; | a ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cppd:5:1s: (note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here :n670: t15: warning: hinitializer order does not match the declaration order [-Wreorder-ctor] 5 r670 | e | a dtiDds(tE)id)F,, nIt hrNteadsiE(ntd_hreInadsnc)B,lock(threadclDeIvFundc(AlxlR t.eidInxdBlo)c,k(th readguIdxrc.oup(group), e_xT),| REE_LL128_PreM grulSum_u32_2,oup( grnoup)c, c| ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ l| tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ F671 | u stnep ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~Sc | i tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ z 671 | e A( l sstleptSReize(pstepSSieze_id ==uz ce, FuncPree_ ==MulS u0 ? mncc,l0S ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32_2, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ uhmintem.com32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: m.buffSizes[note: NCCexpanded from macro 'DEFINE_ncclDevFunc'L_P ROT O_SIM611P | L E]/ NCC L_S TEPRS/suizenof(WT) o: srtepkSiBze_a) {t c| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~h, algo, proto, unroll>().run() ;| group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives \ | ^ , /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32_4, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nth/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hreads(nthreads), tidInBlock:(threadIdx.x), group(group), 670:| 15: ^~~~~~~~~~~warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32_2, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2);: | In file included from ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:432::78:11 note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] | i496f ( | tid < su bt n) Rtid(tid), nthreads(unnWorkColl()t.hreradsu), n(tid, subtn, wwid(otidr%WAkRP_)SIZ;E), war p(t| id/W ^ARP _/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cppSIZ:E),7 :| ~~~~~~~~~~~~~~~~~~ 1| stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) : 497 | note: win instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested herearpI _PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nB lock(7th | DEFINE_ncrceadlIdxD.x/eWARvP_SFIZEu), nc(AllReduc| e ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread(_(TREtid%4)==3), gE_rSIMoPLEu_PpreM(ulSgurm_uo32_u2, ncpclF), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | unc warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3All Redu ce499 | stepSize(nc, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().clShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_u32_2, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCinitializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u32_2, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ CL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32_4, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32_2, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RIN:G670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u32_4, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ _SIMPLE_PreMulSum_u32_2, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(:t670:15: iwarning: initializer order does not match the declaration order [-Wreorder-ctor] d670 | ) tid(t,id), nth reads(nnthretads), htreads(nthreads), tidInBlock(threadIdidInxBloc.k(threxadIdx.)x), gro,up(gro up), | group(group), ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ s | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | tepS ize(s tepSistepze_ Size(stepS=i= 0 ? zncclShe_ mem.comm.buffSizes[NCCL_PROTO_SIMPLE]== 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here /NCCL63_STEPS | /sizeo f(T) : stepS ize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ P| group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hr:303:90: inote: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here m303 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hY>, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | r:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | ifun TreeUp(Down,u COLL_bUNROLL>t(tid, nnthread)s, RunWorkColl, 0, 2, 4>::run' requested here o432 | , if (CtidOLL_U < sNubtnROLL>().r) RunWorkColl, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMLLu_UNRlOLL>S().ruun(tmid, _subtnu, wo3rk);2 | ^_ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp2, ncclFuncAllReduce, Fu:17:n1: note: cin instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here P17 | DErFINEe_nccMlDeulSum, uint32_t, NCCL_ALGO_vRFunIc(ANllRGeduce_TREE_,SIM PNCLE_CPreL_PROTOMulSum_u32_4, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO__STIMPLRE, E2)E , | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hN:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' C 611 | C RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: 4) field 'nthreads' will be initialized after field 'tidInBlock' | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h :611:62:670 note: expanded from macro 'DEFINE_ncclDevFunc' | 611 | R unWo rkBtatcih,, al go,n prtotoh, unrrolel>(a).rds(nthreads), tidInBlock(threadIdx.xun(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock()t, hgroreadIdx.x)up(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlo, g/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hcroukp(g(routp),h | r ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.he:670a:60:d note: field 'group' will be initialized after field 'stepSize' I 670d | x t.id(xtid)),, n thrgeadrs(ntohureapds:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u32_2, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (group), | ^~~~~~~~~~~ ), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u32_2, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u32_4, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid(tid), nthreads(nthreads), tidInBlock(threadI:670:15: dwarning: initializer order does not match the declaration order [-Wreorder-ctor] x670 | ti.d(tid), nxthreads()nthreads,), tidInB lock(thregadIdx.x)r, ougrp(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~oup (group) | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_, | 671 | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ stepSiz671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCLe(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives<_STEPS/Tsizeof(,T) : ste pSize_) {R | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ e| group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:d63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here O 63 | Prpimitiv,es< FanAsymmeT, RtedOp, Fric<1, NCCanSymmetLric_<1MAX_DEV_A>, R0, IProto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32_2, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u32_2, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u32_4, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32_4, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(gr 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32_2, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ oup), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32_4, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32_4, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32_4, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32_4, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] (); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32_4, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_u32_2, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32_4, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(g/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threaroup), | ^~~~~~~~~~~ dIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32_4, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:note: field 'group' will be initialized after field 'stepSize' 11670 | : tiIn file included from d(t/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hid), :nthre175ads(nt: hrea/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.hds),: tidI498nBloc:k(thr29eadId17 warnings generated when compiling for host. :x.x), grouwarning: p(grofield 'group' will be initialized after field 'stepSize' [-Wreorder-ctor]up), | ^~~~~~~~~~~ 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_u32_2, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32_4, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u32_2, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u32_2, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32_4, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPL/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primiti/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32_4, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ves, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), groruunTreeUppDown, )COLL_UN,ROLL>(ti d, n | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == threa0ds, wor k); ?| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h: 432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested heren 432 | c clShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/siz if (tid < subtn) RunWorkColl, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u32_4, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ L_UNReof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | OLL>(P).run(rtid, isubtnm, worki); | t ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:17i:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested herev es17ed, 0, Proto,uce _TRE0E_SI>MPL prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | E_P reMulrSum_u3u2_4,n ncclFuRncAlliReducneg, (tid, nthFruncPreeMulSaum, uidnt32_st, NC,CL_AL GO_TRwEE, NCCL_PROTO_SIMPork); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl, Palgo, rprotoo, unrto, COLL_UNROLL>().runoll>(().runt(); \i | ^ d/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:,15: subtn, w note: ofield 'nthreads' will be initialized after field 'tidInBlock' r670 | k); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc ( A tlid(tild)R, entdhrueacdse(n_thRreIadsN),G t_idSInBlock(threadIdx.x), group(group)IMPLE_PreMulSu, m| ^~~~~~~~~~~~~~~~~_ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:u60:3 note: 2field 'group' will be initialized after field 'stepSize'_4, ncclFuncAllReduce, FuncPre M670u | l Su tmid,(t idu),i nnthtre3ad2s(_ntthr,ea ds), tNidICnBCloLck_(tAhrLeaGdIOdx_.xR),I gNroGup,(gr ouNp)C, C | L ^~~~~~~~~~~ _PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u32_4, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u32_4, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u32_4, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads),/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u32_4, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | runsTreeUptDownS, COLLi_UNROLzL>(tide, nthr_eads, work)=;= 0| ^ ? ncclSh /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hm:432:78e: m.comm.buffSizesnote: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here [432 | N C if (CL_PROTOtid < _suSIMPLE]/NCCbtn) RunWorkColl, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32_4, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ _UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32_4, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32_4, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32_4, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u32_4, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u32_4, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 21 warnings generated when compiling for gfx942. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx1101. 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx942. 21 warnings generated when compiling for gfx90a. [ 62%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u64.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, da_t datta1, flaag1, data22, flag2;, | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h: 145:21: warning: unused variable 'flag1' [-Wunused-variable]f 145 | l uinta32_g2; | ^~~~~ t/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h data1, f:145:21: warning: unused variable 'flag1' [-Wunused-variable] lag1 , data2145 | u, fliag2; nt32_t data1, | ^~~~~f /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28:l warning: unused variable 'data2' [-Wunused-variable] 145ag1, data2, f | l uint3a2_t data1g2; , flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1,32_ t dadata2, flag2; ta 1, f| lag1 ^~~~~, dat a2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1111: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:: 175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:In file included from 80:5/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: : note: warning: unused variable 'w' [-Wunused-variable] expanded from macro 'barrier_by_group'80 | bar rier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = tIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | 29 | const int w b= thraeadIrdx.rx/WARPi_SIZEe; \ r| ^ _by_grohrueadIdpx.x/WA(RP_S)IZE; ;\ | ^ | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = nc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLclShomem.c;han nelId -| ^~~ work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h15: warning: unused variable 'bid' [-Wunused-variable] 218 | co:n218:15:s warning: unused variable 'bid' [-Wunused-variable] t218 int bid = ncclShmem.channelId - wor | kconst- int >bid = cncchlShamem.cnhannenlId -e wlLo; | ^~~ ork->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->ch:366:15a: warning: unused variable 'bid' [-Wunused-variable] n 366 | n conest inlt bidL = ncoclShm;em.ch ann elId| - wo ^~~rk->c hannelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | In file included from ^~~~~/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, fIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ lag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_grouIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threp(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ adIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); : /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: 27 | note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ const int bid = In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->chncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | constannelLo; | ^~~ int bid = ncclShmem.channelId - work->chaIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ nnelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, In file included from fl/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ ag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ 1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_2, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_2, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_u64_2, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_u64_2, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_2, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(n: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buftfhreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Sizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_u64_2, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_2, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? nadIdx.x), group(group), | ^~~~~~~~~~~ cclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_2, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15:stepS ize(stepwarning: Sizinitializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(te_ == id), 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEnthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSiPzS/sizeeof(T) : sstepSize_[) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ N | group(group C/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: Cnote: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | L Prim_itives,T /*) : sDirecttep=*/Size_) {0, Proto/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64_2, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDow | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | n< ^T, Re dOp, P/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hr:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | ot oSimpl runRing, COOLL_UpNROLL,>(tid, nthreads, w orkP); | ^r /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:o432:78t: o, COLL_UNROnote: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here L432 | L i>f (t(tid, nthreads, worid k< subt)n) Ru;nWork Co ll().r| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncunc(tidl, subtn, woDrk);e | ^v /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:F7:1:u note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here n 7 | cDEFI(NE_nAcclDlevFulnc(ARllReeduce_TdREE_SuIMPLcE_ 1>, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_2, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ PereM_ulSuRm_u6I4_2,N nccGlFun_cAllSReduIce, MFuncPPreMuLlSumE, u_int64_t, NCCL_PAreMuLlSGuO_TREE, NCCL_PROTO_SIMPLE, 2) m_u64_2, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, N| ^ C/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:C611:62L:_ note: expanded from macro 'DEFINE_ncclDevFunc'P 611R | O RTunOWork_BaStchIe, aldgo,o prpoto<, utnroyll>>().r,un( ); a\ lgo, proto, unr | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | o ^~~~~~~~~~~~~~~~~ll >/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthread:s670:60): ,note: field 'group' will be initialized after field 'stepSize' t670i | dInBl o ctikd(t(idt)h, rntheradIdx.x), group(egarodsu(npth)re,ad s) , | t ^~~~~~~~~~~~~~~~~id In/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hBloc:k670(t:hr60ea: note: field 'group' will be initialized after field 'stepSize' 670 | dIdx .xt),i gdro(upt(giroudp)),, nthreads(nthreads), tidInBlock(threadIdx.| ^~~~~~~~~~~ x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_2, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_2, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint6/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h4:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_4, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadI_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_u64_2, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unrIn file included from oll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_2, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64_2, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, nthreads(/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_2, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthsubtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_4, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ reads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_2, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSizIn file included from e/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_u64_2, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from (stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h: 173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15 : warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tiPd), nthreadrs(nthrieads),m tidInBlock(threadIdx.ix), grotives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, IMPLCE]/NCOCL_STLEPS/siLzeof(_T) : sUtepSiNze_) {R | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~O | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hL:254L:90: note: >in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254( | t Pirimitdives<,T, Re dOp, nFanAstymhremetads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hric, 0, 2, 2>::run' requested here , 1>, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1:565 | note: ruin instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested herenTre eUpD own, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkCo, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ll().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_2, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_u64_2, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_2, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_4, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_u64_2, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), ti/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ dInBlo ck(threadId671x.x), gr | oup(gro up), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSiz steepSize((sstepSize_ == 0 ? ncclShmem.comm.tepSibze_ == u0 ? ncclSfhmem.cofmm.buffSSiizes[NCCL_PROTO_SzeIs[NCCL_MPROTO_SPIMPLE]LE/N]/NCCL_CCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_2, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64_2, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidIIn file included from nBlock(thre/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_2, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ adIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_4, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NC/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_4, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ CL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid)In file included from , nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_2, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthre/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64_2, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_2, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInB/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hlock(threadIdx.x), :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64_4, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ), nthreads(nthreads), gtidInBlroup(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64_2, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64_2, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_4, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64__UNROLL>, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_4, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 4, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_2, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x) note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) R, ugroup(ngroup)W, | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | o tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | r kstepSiCze(stoepSizel_ == 0l ? nc, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here L303 | Pri_UmNROLL>i().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDev/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid)Func(AllReduce_TREE_SIMPLE_PreMulSum_u64_2, ncclFuncAllReduce, FuncPreMulSum, tivesu, /N*DireCct=*/0C, ProLto, 0>_ALGO_TREE, NCCL_PRO prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64_2, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ toSimple<1, 1, COLL_UNROLL>, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: Tnote: O_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_2, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_4, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64_4, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_4, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), grou/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_4, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ze(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_4, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx./builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64_2, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(thx), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64_2, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ readIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_4, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_u64_2, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h | :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_4, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthstepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_4, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64_4, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_4, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64_2, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64_4, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTnthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkCollO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64_4, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_4, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_4, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_4, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64_4, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_4, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadId/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_4, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ x.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64_4, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_4, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64_4, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64_4, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64_4, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64_4, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx1030. [ 62%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h::12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from 18/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77::18 warning: unused variable 'y' [-Wunused-variable] 77 | uin: warning: unused variable 'y' [-Wunused-variable]t 77 | 3 uin2t32_t y,_ head, matntissa y, head, mantis; | ^ sa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from lS/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hhmem.ch:annelI173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] d - work->channelLo; | ^~~ 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ .channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: dIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80a:5: warning: unused variable 'w' [-Wunused-variable] t80 | baarrier_1by_group,(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:f15: note: expanded from macro 'barrier_by_group' l29 | coanst intg w =1 threadId,x.x data2, flag2In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ ; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145/WA | RP_SIZE ; \ | ^ uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ 11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | b/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ arrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_groupier(_by_group)(); | ^~~~~~~~~~~~~~~~~~ ;/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | co nst int w| = thread ^~~~~~~~~~~~~~~~~~Idx.x/WAR P_SIZE; \/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h | ^ :29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: Lo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ :218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int biwarning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ d = ncIn file included from c/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ lShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | In file included from barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' In file included from 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145int32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZEIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: ; \ unused variable 'w' [-Wunused-variable]| ^ 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15:218::15: warning: unused variable 'bid' [-Wunused-variable] 218 | warning: conunused variable 'bid' [-Wunused-variable]st int bid = ncclShmem.218channe | lId - work->c hannel Lo; | ^~~ const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h.channelId - work->channelLo; | ^~~ :366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670In file included from :15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.ht:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), DevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLEIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/si]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | zeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), grLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_4, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_4, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_4, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_4, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_4, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_4, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8_4, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_4, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8_4, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_4, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8_4, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthread/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWos), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ rkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_4, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8_4, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_4, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_4, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_4, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8_2, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_4, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_4, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_4, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_4, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_4, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8_4, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_4, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_4, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_4, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_4, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8_4, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8_4, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8_4, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8_4, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8_4, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8_4, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8_4, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx1101. 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx942. [ 63%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_bf16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ 366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ 15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1,In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ 175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().r,u n(RteiddOp,, sPurbottno,, wCoOrLkL)_;U N R| O ^L L>(tid, nt/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpph:r17e:a1d:s ,note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested herew ork); | ^ 17 | DEFINE_ncclDevFun/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hc(:A432l:l78R:e note: din instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested hereu ce_TREE_SI M432P | L E _ P r o di_fb f(1t6i_d4 ,< nscucbltFnu)n cRAulnlWRoerdkuCcoel,l (N)C.CrLu_nP(RtOiTdO,_ SsIuMbPtLnE,, w4o)r k )| ;^ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc'/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp :12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here611 | RunWo 12rkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_4, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ toSimple<1, 1, COLL_UNROLL>, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthread/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_4, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIs(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_4, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ dx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_4, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_4, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(grou/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreap), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ds(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_4, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid)/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16_4, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, , nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_4, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_4, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16_4, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_4, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_4, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBl/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16_4, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_4, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_4, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_4, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_4, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINIn file included from E_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hn:c11c: lIn file included from De/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hv:F173u: nc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h(A:l670l:R15e:d uwarning: ceinitializer order does not match the declaration order [-Wreorder-ctor]_ RING_SIMPLE_Prod_bf16_4, ncclFunc Al670l | R e d u ctei,d (Ftuindc)P,r ondt,h rheiapd_sb(fnltoharte1a6d,s )N,C CtLi_dAILnGBOl_oRcIkN(Gt,h rNeCaCdLI_dPxR.OxT)O,_ SgIrMoPuLpE(,g r4o)u p )| ,^ | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_: 611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 671 | 611 | s t e pRSuinzWeo(rsktBeaptScihz.,c oamlmg.ob,u fpfrSoitzoe,s [uNnCrCoLl_lP>R(O)T.Or_uSnI(M)P;L E\] / N| C ^C L_STEPS/s/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hi:z670e:o15f:( Tnote: )field 'nthreads' will be initialized after field 'tidInBlock' : stepSi z670e | _ ) { t i| d ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~( t i| d group(group) , nthreads(nthreads), tidInBlock/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h(:t63h:r56e:a dnote: Idin instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested herex .x), gr o63u | p ( g r oPurpi)m,i t i| v ^~~~~~~~~~~~~~~~~e si,d (0t,i dP)r,o tnot,h r0e>a dpsr(inmtsh r e| a ^d s), tid/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hI:n558B:l5o:c knote: (in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested heret hreadI d558x | . x ) , rgurnoRuipn(gg(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16_2, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_4, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16_4, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_4, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_4, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16_4, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_4, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16_4, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_4, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_4, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16_4, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16_4, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16_4, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16_4, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16_4, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1030. 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx942. [ 63%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_bf8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:1: In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = nc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:clShmem.channel2: In file included from I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.hd - work->channelLo; | ^~~ :75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->ch/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ annelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | st/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h | epSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: :warning: 670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] initializer order does not match the declaration order [-Wreorder-ctor]670 | t 670 | tiid(tid), nthreads(nthread(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ds), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), grou 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_4, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ p(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_4, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIM 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here PLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_4, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_4, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_4, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_4, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_4, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_4, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_4, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8_4, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_4, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, wor/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_4, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ k); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_4, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_4, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8_4, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_4, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_4, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> pri/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_4, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ms | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_4, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8_2, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_4, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8_4, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_4, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8_4, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_4, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_ ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8_4, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ bf8_4, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8_4, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8_4, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8_4, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8_4, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_4, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8_4, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8_4, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1101. 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx942. [ 63%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f16.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ : warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hIn file included from :173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp: 2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75 :7: warning: unused variable 'w' [-Wunused-variable] uint3 75 | barrie2_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; r_by_gr| oup(); ^~~~~ | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29 :15: note: expanded from macro 'barrier_by_group' /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h 29 | const: int w145 = thre:adIdx.28x/WARP_:SIZE; \ | ^ In file included from warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work:218->c:ha15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bnneilLo; d| ^~~ = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->cha:366n:15: warning: nunused variable 'bid' [-Wunused-variable] 366 | e conslt int Lbid = nocclShmem.channelId - work->channelLo; | ^~~ ; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = nIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ cclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ : warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | cIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ onst int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145::28218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ : warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncProd<__half>, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncProd<__half>, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCnote: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_LS_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncProd<__half>, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ IMPLE_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidIn), BtidInBloclk(threadIodx.x), grcoup(group)k, | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ (threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671671 | s | tepSize(s tepSize_ == 0 ? ncc lShme m.stepSizcoemm.buffSi(zstepSies[NzCCLIn file included from e_ == 0 ? ncc_PROTO_SIlMPLEShmem.comm.buf]f/NCCL_STESPS/sizizeeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp: 2: In file included from | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), s[NCCLn_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h: 254:90: note: 254 | Primiin instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested heret 254 | i Pvthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ rimitivees, /*Op, FanAsDireyct=*/0mmetric,, Pr oto, 0/> prims* | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hD:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here i565 | rect=*/0, Proto runTreeUpDown prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>1,( COLL_tUNROLiL>, COdLL_U,NROL L>(tidn, nthrteads,h worrk); e| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.ha:432:78:d note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here s432 | , i f (tidw < soubtn)r k); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432RunW:orkC78oll, 0, 2, 2>::run' requested here 432 | if (T, tRedOpi, dAlgo, Prot().run(tid, subtn, work)/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(thread ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid),tric<1, NCCL_MAX_DEV_ARITY>, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Idx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncProd<__half>, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, prIn file included from oto, unroll>/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), ().runn(); \ t | ^ hreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp: | group(group 2/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:: 254:90:In file included from note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h254 | :Primi11tives<: T, RIn file included from edOp,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h FanAs:ymmet173ric, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COL L_UNR OLL>(stid, ntthreaeds, wpork); S | ^ i/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:z78: enote: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here (432 | stepSize_ == 0 ? ncclShmem.comm.buffSizes if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREIn file included from E/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: ,In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11 : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175N: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498C:29: Cwarning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] L496 | _ tPid(tRid), nthreOads(TnthOreads_), wSid(tIid%WMARPP_SIZLE)E, 2) | ^ , warp(tid/WARP_SIZE/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:)611:62:, note: expanded from macro 'DEFINE_ncclDevFunc' | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)611 | Run497 | warpInBlock(threadIdx.xWo/rkBaWtchAI, alZgo, Epr), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagToto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nhthrreead((atid%4d)==3s),( gronup(grtoup),h | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~r | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 eads), t idInBlock(threadIdx.x499 | ) , group(gr o suteppSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_ST),E | P ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hS:670:60: /note: sfield 'group' will be initialized after field 'stepSize' izeof(ui n670 | t 6 ti4d(_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.htid), :nth461rea:ds(9nth:rea ds)note: , in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | primtisdIn(Btlocik(tdhre,adI dx.x), nthgroup(group), | ^~~~~~~~~~~ readsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncProd<__half>, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncProd<__half>, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMP/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ LE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), grou/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hp(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthr:eads),670 tid:InBlo15ck(t: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | hrea dIdx .x tid(tid), nth), rgroupe(gro | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432upa)ds(nth, r| ^~~~~~~~~~~ea ds), t:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), ntidInBlock(threadIdx.x), group(group), | hreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSizIn file included from e_ == 0 ? nc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ clShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | t/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ id(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(groupIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROT/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ O_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_4, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_4, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_4, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_4, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_4, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_4, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16_2, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_4, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_4, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_4, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_4, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16_4, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_4, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_4, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_4, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_4, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_4, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16_4, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_4, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16_4, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16_4, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_4, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_4, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSi/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16_4, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBloze_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_4, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ck(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_4, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_4, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16_4, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16_4, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16_4, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16_4, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16_4, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16_4, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16_4, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 21 warnings generated when compiling for gfx942. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx908. 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx942. [ 63%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f32.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 17 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cppIn file included from :1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 17 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 17 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 17 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from 17/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ 17 warnings generated when compiling for gfx1030. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, f/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const ilag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ nt bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ rier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ :218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp::174: 2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.hIn file included from :/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h75::117: :In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hwarning: :unused variable 'w' [-Wunused-variable]174 : /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | b75 | a r r i e r _bbayr_rgierro_ubpy(_)g;r o u| p ^~~~~~~~~~~~~~~~~~( ); | ^~~~~~~~~~~~~~~~~~/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h :29:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hnote: :29expanded from macro 'barrier_by_group': 15: note: expanded from macro 'barrier_by_group' 29 | 29c | on s t icnonts tw i=n tt hwr e=a dtIhdrxe.axd/IWdAxR.Px_/SWIAZREP;_ S\I Z E| ; ^ \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 17 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ 17 warnings generated when compiling for gfx1102. [ 64%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f64.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROIn file included from T/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ InBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ T, RedOp, Algo, Proto, COLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_4, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>(/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_P).run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_4, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_4, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_4, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid),In file included from nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthre/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ ads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_4, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_4, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_4, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32_2, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_4, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_4, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_4, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_4, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_4, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_4, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), gr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32_4, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_4, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32_4, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32_4, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_4, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_4, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_4, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32_4, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl()./builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hrun(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_4, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_4, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_4, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32_4, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_4, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32_4, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32_4, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthrea/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56ds), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ : note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32_4, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32_4, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32_4, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32_4, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32_4, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ :2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218In file included from In file included from :15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ :366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cppIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hIn file included from :366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ :218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128, In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LLtid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_4, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ oll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, workUNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ L_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_4, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_4, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Op, Algo, Proto, COLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_4, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_4, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_4, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: : warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_4, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIinitializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_4, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ dx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64_4, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/size/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ of(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runT/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hreeU:p670D:o15w:n h,r eCaOdLsL(_nUtNhRrOeLaLd>s()t,i dt,i dnItnhBrleoacdks(,t hwroerak)d;I d x| . ^x ), group(g/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hr:o432:u78p:) ,note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 432 | 671i | f ( t isdt e

().run( ti | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | sd, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(titepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_2, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tivef6s4_2, nIT,Y, 1 >, /a*Directl=*/0g, Prooto,, 0> p ripmsr oto, unroll>().ru | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_2, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), grno(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tupi(gdroup), | ^~~~~~~~~~~~~~~~~I /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:n60: Bnote: field 'group' will be initialized after field 'stepSize' l670 | o tcid(ktid)(, ntthrheads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ readIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_2, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(kBnatcth, algoe, protoa, unrdoll>s().run)(); \ ,| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h :670:15: note: wfield 'nthreads' will be initialized after field 'tidInBlock' 670 | itidd(tid), n(threatdid%WARP_SIZE), warp(tid/WAs(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hRP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), g:670:60r: note: field 'group' will be initialized after field 'stepSize' 670oup(group), | tid(tid), nthread| s(nthr ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~eads), t idInBlock (thread| Idx.x), warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 gr oup(group), | ^~~~~~~~~~~ 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f64_2, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | 254 | Prim itivest,, /*Dir ect=*/n0, Protto, 0h> primrs | ^ eads(nthreads/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL _UNROLL >(tifd, nthlreads, awgThread((torki); d| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h%:432:78In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_2, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ : 4note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here )432 | if (=ti=3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | d < sub tn) RunWorkColl().run(tid, subtn, work)stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ; ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cppin instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_nccl461DevFun | c(Al lReduce _TREE_SIMPLE_Sum_f64 _2, ncclFun prims(tcAlilRedudce, Fu,n cnthreadsSplit, treSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | e->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | Ru nWo r kBartcuhS,p alglo, pirotot, (),.r un()R;ed \O p, | ^P ro/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.htoLL128, COLL_UNROL:670L:15>: (note: field 'nthreads' will be initialized after field 'tidInBlock't 670i | d, t indt(thireadd),s nthreads(nthreads), tidInBlock(threadIdx.x), group(grou, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tpi), d| ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h,:670: 60: note: sfield 'group' will be initialized after field 'stepSize' u670 | b ttid(ntid),, nt hrewads(nothrreads), tkidIn)Bloc;k(th r ea| ^dI d/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cppx.:5x:),1 :g rnote: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncoup(cgroulp), D | ^~~~~~~~~~~ evFunc(AllReduce_TREE_LL128_Sum_f64_2, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primiti7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_2, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthrIn file included from eads(nthreads), tidInBlock(th/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:ves, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_2, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 498:29: warning: readIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads),field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 tidIn | Bloc k(thre adId x.x) , grwoup(agrourp), p | ^~~~~~~~~~~ InBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f64_2, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_2, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWor611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ kBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]//builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ */0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_2, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_2, ncclFuncAllReduce,In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_2, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | tid(tid), nthrIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColeads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ l().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_2, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthrea/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthds), tidInBlorck(threaedIdx.x),a group(grdoup), | s ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671) | st,ep tidInBlock(threaSize(sdtepSize_I == 0dx.x), group( ? nccglShmem.crooup), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | mm.buf tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_fSizes [N 671 | C CL_PROTstepSize(stepSize_ =O=_SIMPLE ]/NCCL_STEPS/s0i ? ncclShmem.czeofo(T) : smtmep.buffSiSize_zes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitive) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hs:303:90: note: , FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303T | , Primit ivReesd, /*DiArect=*s/0, ymmetric<1, NCCL_MAX_DEV_ARITY>, /P*roto,D 0>i primrs | ^e /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565c:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here t 565 | = r*unTre/eUp0Down prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreReedOp, PUrotoSimple<1,p 1, DCOLLo_UNROLwL>, nCOLL_U(tid,, nthr eads, work)R;e d | ^O p, ProtoSimple<1, /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:1432:78: ,note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | C OLL_UNROLL>, COLL_iUf (tiNd R< suObtn)L RunLW>o(tid, nthreads, rwkCooll, 0, 2, 2>::run' requested here 432 | L_UNROLL>().ru if (tid < subtn) RunWorkColl, 0, 2, 2>::run' requested here A7 | DElFINE_gncclDeovFunc,(AllR educPe_Troto, COLL_UNROLL>()REE_.SIMPrLE_Suum_f64_2, nccn(tid, subtn, wlFuoncAllrReducke,) ; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:FuncSum, dou1ble, :N note: CCin instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(LA_ALlGO_TRlEE, RNCeCL_PRdOTO_uSIMPcLeE_TR, 2) EE_SIMPLE_Sum_f64_2, ncclFuncAllReduce, FuncSum, double, NCCL_ALG| O^_ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:T611:62: Rnote: expanded from macro 'DEFINE_ncclDevFunc' E 611 | E Run,Wo rkBatcNh, aRlgo,O protoT,O u_nroll>S()I.runM();P LE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: \expanded from macro 'DEFINE_ncclDevFunc' | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h :670:15: note: 611field 'nthreads' will be initialized after field 'tidInBlock' | 670 | tRunWorkBatch, alid(tid), nthrego, ads(npthreards), otidtInBlocko, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBloc(kthre(adIdtx.x),h groupr(greoup),a | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hd:670:60I:d note: field 'group' will be initialized after field 'stepSize' x 670 | . tidx(tid)), nth,reads( nthreagds), rtidInoBlocku(threpadIdx(.x)g, grorup(groouupp)), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60, | : ^~~~~~~~~~~ note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f64_2, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_2, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f64_2, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_2, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f64_2, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ .comm.buffSizes[NCCL_PRO/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor]/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h 670 | tiTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:d(ti56d), nth:read s(nthrnote: ein instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | ads), t idInBl o: Primitiv670eck:s(thre15), , 0, Pr | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ o| to, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | note: stepSin instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested hereize(step Size_ == 0 ?558 | ru nncclShmeRming(tid, nthmreadse, wo/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f64_2, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ rkm); . | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hc:432o:78: note: min instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here m432 | L_ST. EPS/b sizu eof(f T) :f stieSpSfizie_) z{ (| es ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | [t group(group Nid /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hC<: Csubtn) RunWorkColl, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here, 303 | R PerimitdivesL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f64_2, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ().run(tid, subtn, work);CCL_MAX_DEV_ARITY>, /*Direct=* | / ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp0:12, P:1:r note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here o 12t | DEFIoNE, 0_> npcclDevFunc(AllReduce_RING_SIMPLE_Sum_f64_2, ncclFuncAllReduce, Funrimsc | S ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:u5: mnote: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here ,565 | d ruonTrueeUbpDolwn, COLL_UNROCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ LL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_2, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x),/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_2, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:), | ~~~~~~~~~~~~~~~~~~15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_4, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_f64_2, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_4, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | ing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f64_2, ncclFuncAllReduce, FuncSum, double, NCCL _tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f64_2, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_4, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f64_2, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumCOLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncc_f64_2, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ lDevFunc(AllReduce_RING_SIMPLE_Sum_f64_2, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work)In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h; | ^:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f64_2, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_LL12 /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid <8, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_4, ncclFuncA:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTOllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run_SIMPLE]/(NCCL_)STEPS/sizeof(T;) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_4, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_4, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f64_2, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_2, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_4, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_4, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_4, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_4, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_4, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitiv/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ es, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_4, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads),/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffS tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ izes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_4, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_4, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_4, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f64_4, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f64_4, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_2, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, su/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPSbtn, work); /sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f64_4, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_4, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto if (tid < subtn) RunWorkColl prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f64_4, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ oto, COLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_4, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threa/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group dIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f64_4, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_4, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f64_4, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_4, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_4, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f64_4, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllRe:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid)duce_RING_LL128_Sum_f64_2, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62:, nth note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ reads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f64_4, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f64_2, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthrea 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ d:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCLs), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : st_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5epSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h558 | runRing(t: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:22:1to:, CO LL_UNROnote: LL>().in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested hererun(t id, subtn, work)22; | ^ | D/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:22:1E: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here F22 | DEFINIE_ncclNDevFuncE(All_Reduce_nRING_cSIMPLE_Sum_f64_4, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PclDevFunc(AllReduce_RING_SIMPLE_Sum_f64_4, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidty>, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreaInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ds(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_4, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_4, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f64_4, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx906. 21 warnings generated when compiling for gfx942. 21 warnings generated when compiling for gfx90a. [ 66%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 29 | const int w = t/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ hreadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const i/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const inntt w = threadIbdx.ix/WdAR P_SI=ZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = In file included from ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable]/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(gro), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ up), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLEIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(st]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_2, ncclFuepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670 :/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h15:611:62:: note: expanded from macro 'DEFINE_ncclDevFunc' warning: 611 | initializer order does not match the declaration order [-Wreorder-ctor] RunW orkBa670tc | h,d al(gto,i proto, unroll>d().run(); \ | ^ ), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlo/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hck(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ _ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_4, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_4, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_4, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_4, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(gro note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_4, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ up), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8_4, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8_4, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_4, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_4, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_4, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8_4, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_4, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_4, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_4, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_4, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_4, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_4, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(t/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:id), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8_4, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(thread/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, wIordkx).;x ) , | g ^r oup(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSiz/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cppe:_17 :=1=: 0note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here? ncclShmem .17c | oDmEmF.INbEu_fnfcScilzDeesv[FNuCnCcL(_APlRlORTeOd_uScIeM_PTLREE]E/_NSCICMLP_LSET_ESPuSm/_sfi8z_e4,o fn(cTc)l F:u nsctAelplSRiezdeu_c)e ,{ F u| n ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~c S u| m group(group, rccl_float8, NCCL_ALG/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hO:_63T:R56E:E ,note: Nin instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested hereC CL_PROT O63_ | S I M P LPEr,i m4i)t i | v^e s , R0u, nPWroortkoB,a t0c>h :,5 : alnote: gin instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested hereo , pro t558o | , u n rroulnlR>i(n)g.note: (field 'nthreads' will be initialized after field 'tidInBlock't id, nthr e670a | d s , wtoirdk()t;i d | ) ^, nthreads/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h(:n432th:r78e:a dnote: sin instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here) , tidInB l432o | c k ( t h r eiafd I(dtxi.dx )<, sgurbotunp)( gRruonuWpo)r,k Co l| ^~~~~~~~~~~~~~~~~l e(a)d.sr(unnt(htrieda,d ss)u,b ttni,d IwnoBrlko)c;k ( | t ^h readIdx.x/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp):,12 :g1r:o unote: pin instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here (group), | 12 ^~~~~~~~~~~ | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8_2, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_4, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlo/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_4, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tick(threadIdx.x), group(group), | ^~~~~~~~~~~ dInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8_4, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_4, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8_4, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_4, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8_4, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_4, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_4, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8_4, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8_4, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8_4, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8_4, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 21 warnings generated when compiling for gfx90a. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8_4, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 21 warnings generated when compiling for gfx942. [ 66%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u32.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ :218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ .channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from In file included from In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | b:a11rr: iIn file included from e/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hr:_175b: y_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.hg:r80o:u5p:( )warning: ;unused variable 'w' [-Wunused-variable] | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: 80note: | expanded from macro 'barrier_by_group' ba r29r | i e r _ bcyo_ngsrto uipn(t) ;w =| ^~~~~~~~~~~~~~~~~~t hreadIdx/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h.:x29/:W15A:R Pnote: _expanded from macro 'barrier_by_group'S IZE; \ 29 | | ^ const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ :218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: :366:15:unused variable 'bid' [-Wunused-variable] warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ :218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_2, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_2, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_u32_2, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_u32_2, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_u32_2, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_2, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_2, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_2, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_2, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_2, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_2, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_2, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_u32_2, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_2, ncclFuncA tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ llReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32_2, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_u32_2, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_u32_2, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32_2, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_2, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_2, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid:670:15(: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | t tid(tiid), ndthreads()nthreads,), tidIn Block(thrneadIdxthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_2, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ .x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_2, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor]In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2 : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_2, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_2, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_2, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_2, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_4, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_2, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32_2, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthre stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_2, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_4, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32_2, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_u32_2, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32_2, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] RedOp, Proto, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (t670i | d < s tuibdt(nt)i dR)u,nW onrtkhCroelaldr(o)u.pr(ugnr(otuipd),, s u| b ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~t n ,| tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_w ork); | ^ 671 | ste/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cppp:S12i:z1e:( snote: tin instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested heree pSize_ == 0 12? | DnEcFcINlESh_mnecmcl.DceovmFmu.nbcu(fAflSliRzeedsu[cNeCC_LR_INPGR_OSTIOM_PSLIEM_PSLuEm]_/uN3C2C_L2_,S TnEcPcSl/FsuinzceAolfl(RTe)d u:c es,t eFpuSniczSeu_m), { u i| n ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~t 3 2| group(group_ t, NCCL_ALGO_RING, NCCL_PROTO_S/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hI:M303PL:E90,: 2note: )in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here | ^ 303 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h : 611 : 62 :P rnote: iexpanded from macro 'DEFINE_ncclDevFunc'm itives <611T | , R e d ROup,n WForaknBAastymcmheV,_ AaRlIgToY,> ,p r/o*tDoi,r eucntr=o*l/l0>,( )P.rroutno(,) ;0 >\ p r| i ^m s | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h::565670::515:: note: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested herefield 'nthreads' will be initialized after field 'tidInBlock' 565 | 670 | tid(tid), nthread s (rnutnhTrreeaedUsp)D,o wtni, COLgLr_oUuNpR(OgLrLo>u(pt)i,d , | n ^~~~~~~~~~~~~~~~~t hreads/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h,: 670w:o60r:k )note: ;field 'group' will be initialized after field 'stepSize' | ^ 670 | tid/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h(:t432i:d78):, note: nin instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested heret hreads(n t432h | r e a d s ) ,i ft id(ItniBdl o().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_2, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_2, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_4, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32_2, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32_2, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_4, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32_4, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_4, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32_2, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_u32_2, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] : 670 | t670id(tid),: nthread15s(nthread:s), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_4, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_4, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32_2, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_4, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32_2, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_4, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_4, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32_4, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_4, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_4, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ k(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_4, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_4, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(ste/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hpSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_4, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32_4, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_4, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid)/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | , nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32_4, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_4, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_4, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32_4, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_4, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_4, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32_4, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_4, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32_4, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32_4, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32_4, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32_4, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32_4, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32_4, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx1200. 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx942. [ 67%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u64.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp 21 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_gr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ oup(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmeIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29m.channelId - work->channelLo; | ^~~ :15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ :2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - wIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ ork->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , RedOp, Algo, Proto, COLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_4, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_4, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_4, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, un/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_4, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x),roll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_4, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, wo/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u64_4, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ rk); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(, tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllRedsteupSizec(setepS_ize_ T== 0R ? ncEclSE_SIMPLhmEem.co_mmS.ubmuf_u6fSi4zes[_N4C,CL_ PnROcTclOF_SuncAllReduce, FuncSum, uint64_t, NCCLIM_PLEA]/NCCLL_STGEPS/Osizeof_(T) : stepSizTe_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ RE | E group(group, /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h NCC:254L:_90:P ROTO_note: Sin instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254I | Primitives, algo, proto, unroll>N(CCL_)MAX_.DEV_rARITuY, 1>n, /*(D)irec;t=*/0 , P\roto , 0 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h> prims :670:15: | ^note: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hfield 'nthreads' will be initialized after field 'tidInBlock':565:5 : 670note: | in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565t | id ( trid), nthreads(ntunThreeUrpDowen, COLL_UNROLL>(tid, nthreads, work); | ^ Idx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h| :432:78 ^~~~~~~~~~~: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_4, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] | ^ 670/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' | 670 | ti d(t idt), inthredads((nthrteadsi), tdidIn)Bloc,k(th reandIdxt.x)h,r eagdrsoup(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670(:nthr60eads:), note: field 'group' will be initialized after field 'stepSize' 670 | t id InBltock(tihreadIddx.(x), tgrid), nthreads(nthreadsoup()grou, p)t, | i ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ d| tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ I671 | nBlock(thread stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSizeIdx.x), group(group), | ^~~~~~~~~~~ _) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_4, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSiz/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.he:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ s[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_4, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h558 | runRings(nthr)(eads,), tidInBltock(threiadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncc lnthreads(nthreSads), htidInBmlock(ethreadIdmx.x), g.roup(gcrouopmm.buffSizes[NCCL)_, | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ d, =nthre=ads, work)0; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h?:432: 78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here n 432 | cif (ticd < slubtSn) RunhWorkCmoll()b.runu(tPROfiTO_SfdIM,SPLE] i/szNCCuLe_STEbsPS/st[izeonNf(T,C) : CsL t_weoPpROTO_rkS); SIi| ze_ ^) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u64_2, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | MPLE]/NCCL_STEPS/ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpps:22:1: inote: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here z22 | DEFeINE_nocclDevFunf(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_4, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hc:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | (A565llR:educe5_RING tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buff:_SIMPL E_Sumnote: _u64in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here_4, n cclFun cAllReducSizes[NC565C | L_ P R O TrOu_nSTIrMePeLUEp]D/oNwCnC, COLL_UNROLL>(tid, nthreads/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h,: 254wo:r90k:) ;note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here | ^ 254 | Prim/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hi:432t:iv78:es note: , 0, 2, 4>::run' requested hereT, RedOp, Fa432 | n A sy m m e tirfi c(l,l /<*FDni,r eTc,t =R*e/d0O,p ,P rAoltgoo,, 0P>r optroi,m sC O | L ^L _UNROLL>/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h(:)565.:r5u:n (note: tin instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested herei d, subt n565, | w o r kr)u;n T r| e ^e UpDown, 0, 2, 4>::run' requested heret oSimple<1, 171 | ,D ECFOILNLE__UnNcRcOlLDLe>v,F CuOnLcL(_AUlNlRROeLdLu>c(et_iTdR,E En_tShIrMePaLdEs_,S uwmo_ruk6)4;_ 4 ,| ^ ncclFuncAllR/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.he:d432u:c78e:, note: Fin instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested hereu ncSum, u i432n | t 6 4 _ t , iNfC C(Lt_iAdL ( | ) . r u nR(utniWdo,r ksBuabttcnh,< cwoolrlk,) ;t y ,| ^r edop,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp :a17l:g1o:, note: pin instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested herer oto, unrol l17> | (D).run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ e, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_4, ncclFuncAllReduEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_4, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_4, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock'/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (ti 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ d < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_4, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffS/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: iinitializer order does not match the declaration order [-Wreorder-ctor]zes[NCCL _PROTO_S IMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_4, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_A | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h(:611:62: )note: expanded from macro 'DEFINE_ncclDevFunc' 611 | . RunWrorkBatuch, aligo, prodto, un,roll>() .run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:s15: note: field 'nthreads' will be initialized after field 'tidInBlock' ubtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp670 | tid(tid), nthreads(nthreads):22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u64_4, ncclFuncAllReduce, FuncSum, uint64, ti_dItnBl,ock(th readINdx.x)C, groCup(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60L: note: field 'group' will be initialized after field 'stepSize' _ 670 | A tid(Ltid),G nthOreads_(nthrReads)I, tNiGdI, nNBlCoCckL_(PthRrOeTaOdI_SdIx.MxP)LE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' , 611gro | up(g roup), | ^~~~~~~~~~~ RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_4, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(ti/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hd, subtn, work); :670:15: warning: | initializer order does not match the declaration order [-Wreorder-ctor] ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 670 | tid(tid), nthreads(nthre/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u64_4, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ads), t | DEFINE_ncclDevF/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hunc(AllRed:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] uc 670 | tid(tid), e_RING_nthreads(nthSIMPLEreads), tidInBlock(threadIdx.x), gr_Sum_u64_4oup(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_4, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (stRepSIize_ N== 0 G? ncc,lSh mem.cNoCmmCL.b_PRuOTO_ffSizesS[INMCCPLL_EP, 4)RO TO_S | IM^ P/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hLE]:/611:NC62:C L_note: Sexpanded from macro 'DEFINE_ncclDevFunc' T EPS611/ | sizeof(T) : stepSize_) { RunWorkBatch, algo, proto, unroll> | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ ( | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h):63.:56:r note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here u63 | n P(rimi)tive;st, 0,i Prod(tid)to, 0> p,rim sn t | hr ^ eads(nthreads), tidInBlock(thre/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558a:5: note: din instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here I558 | d ruxnRin.g(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested herefield 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u64_4, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_4, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_4, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u64_4, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_4, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u64_4, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u64_4, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64_4, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u64_4, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u64_4, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 21 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx908. [ 67%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_grdata2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ oup(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclSIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ hmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hIn file included from :366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_2, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_2, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_2, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_2, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_2, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ lShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_2, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_2, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_2, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_2, ncclFuncAllReduce, FuncSum, uIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_u8_2, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_u8_2, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_u8_2, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_u8_2, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_2, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_u8_2, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_u8_2, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_2, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_2, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ _TREE_SIMPLE_Sum_u8_2, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_2, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_2, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_2, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ eads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8_2, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hnote: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8_2, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_2, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_2, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8_2, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_2, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8_2, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8_2, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), g/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_2, ncclFuncAroup(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8_2, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ llReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_4, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8_2, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_4, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(t:i670d:)15,: nwarning: thinitializer order does not match the declaration order [-Wreorder-ctor]r eads(nthreads), tid I670n | B lo c k (ttihdr(etaiddI)d,x .nxt)h,r egardosu(pn(tghrroeuadps)),, t| i ^~~~~~~~~~~~~~~~~d InBl/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.ho:670c:k60(:th note: rfield 'group' will be initialized after field 'stepSize'e adIdx.x )670, | g r o utipd((gtriodu)p,) ,n t h| r ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~e a d| s tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_( nthreads) ,671 | t i d I nsBtleopcSki(zteh(rsetaedpISdixz.ex_) ,= =g r0o u?p (ngcrcoluSph)m,em . | c ^~~~~~~~~~~o mm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_2, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : st/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_2, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ CCL_MAX_DEV_ARITY, 1>, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_4, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_4, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_4, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), grIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] oup(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_u8_2, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_4, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), gr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShm/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_4, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ oup(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_4, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ em.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_4, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | lDev Func(All ruReduce_RING_LL128_nRSing, algo, proto, unroll>().run(); \ | ^ Proto, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8_2, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_4, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8_2, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8_2, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8_2, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_ R22I | NDGE,F INNCEC_Ln_cPcROlTDOe_vSFIuMnPcL(EA,l l2R)e d u| c^e _RING_S/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hI:M611P:L62E:_ note: Sexpanded from macro 'DEFINE_ncclDevFunc'u m_u8_4 ,611 | n c c l FRuunncWAolrlkRBeadtucche<,c oFluln,c tSyu,m ,r eudionpt<8t_yt>,, NaClCgLo_,A LpGrOo_tRoI,N uGn,r oNlClC>L(_)P.RrOuTnO(_)S;I M\P L E| , ^ 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8_4, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_4, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_4, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8_4, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_4, ninitializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_4, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: cclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | field 'group' will be initialized after field 'stepSize' 670 | t RunWorkBatch, algo,id(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(grou pp)r,o t o| , ^~~~~~~~~~~ unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_4, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_4, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_4, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8_4, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8_4, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8_4, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8_4, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_4, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_4, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_4, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_4, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8_4, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8_4, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8_4, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8_4, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8_4, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1200. 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx942. [ 67%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hSIZE; \ | :27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ 2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ : /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: In file included from unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp: 2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:warning: 11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: unused variable 'bid' [-Wunused-variable] /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145: 14: warning: 218 | const int bunused variable 'data1' [-Wunused-variable] i145 | d uint3 =2_t dat a1, fnlag1,c data2c, fllag2; S | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:h145:21: warning: munused variable 'flag1' [-Wunused-variable] 145 | e uinmt32_t .data1,c flag1,h data2a,nnelId - wor flakg2; -| ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h>:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flachannelLo; | ^~~ g1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h uint32_t data1, flag1, data2, flag2; | ^~~~~ :366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hunused variable 'data1' [-Wunused-variable]:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | 145 | co ns uit innt32_t datat bid =1 nccl, flShmem.channelIag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, dda ta2- wo,rk->channelL o; | ^~~ flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(In file included from )/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ ; | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - worIn file included from k/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ ->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelL:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from o; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ uint32_t data1, flag1, daIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ ta2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ : warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32_2, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_i32_2, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ 15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32_2, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_i32_2, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32_2, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) runTreeU 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_i32_2, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ pDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32_2, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15clShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32_2, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ : warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32_2, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32_2, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiPROTO_SIMPLE]/NCCL_STEPS/v_i32_2, sncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PRizeof(T) : stepSize_OTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32_2, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32_2, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32_2, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInB/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_Slock(threadIdx.x), gTEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32_2, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREroup(group), | ^~~~~~~~~~~ E, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32_2, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | :670:15: swarning: initializer order does not match the declaration order [-Wreorder-ctor] t670 | etid(tidp), nthSreads(inthreadzs), tideInBloc(k(threasdIdx.x), gtroup(egroup), p | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ S 671 | i stze_ == 0 ?epS ize(stenpScclShmem.ize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLcomm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | PrE]/NCCiL_STEPSm/sizieof(T) :t stepSiize_) {v | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(groupe /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:s90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here <303 | T , RedOp, FanAsyPrimitmives, /*Direct=*/_MAX_0DEV_ARIT,Y>, /*D Pirect=*/0, Proto, 0In file included from > prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: 5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid),roto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32_2, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ p, ProtoSimple<1, 1, COLL_UNROLL>, COLL_UNROLL>(tid, nthread nthsread,s(nt hreawdso), tridInkBloc)k(thr;eadI dx.x ), g| roup ^(grou p)/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (t, i| ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | d tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | < st epSizes(steupSizbe_ =t=n) Ru 0 ? ncclShmem.comm.buffSizes[NCCL_PROTOnWork_CollSP().Srun/sizeof(T) : stepS(itid,z subetn, _work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32_)2 { | , ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h: 254:90: nnote: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here c254 | c l PriFmitiuves, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: nin instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested herecSum Post Div, int56532_t | , N CCL_A LGO_ TREE , NCrCL_PuROTOnT_SreeUpDown, algo, proto, unroll>im(ple)<1,. 1,r COLun(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' L_U NROL670L>, | CO LL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColladI(dx.).run(tidx),, gr oups(gruobtn, woup), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tirdk);I | n ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cppB:l7:1o: note: cin instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here k7 | (DEthreadIdx.x), group(group),F INE _nc| clD ^~~~~~~~~~~evF unc(AllReduce_TREE_SIMPLE_SumPostDiv_i32_2, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_i32_2, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32_2, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_i32_2, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32_2, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32_4, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_i32_2, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32_2, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreadIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), ts(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ idInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h, nthreads, wo:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] rk); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h670:432 | tid(tid), nth:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().rmun(tid,m subt.n, workb); | ^u /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cppf:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DfEFINE_nSccizes[NClDevCFuncL_PROTO_SIMPLE]/NCCL(Al_lReduceS_TREE_TSIMPLE_ESuPS/sizeof(T)mPostDi v_i32:_2, n stepSize_) {cclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_A | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllRe_DEV_ARITY>, /*Direct=*/0, Proto, 0> prLGO_iTREmE, NCsCL_P ROTO _SI| MPLE, ^ 2 ) | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62:: note: expanded from macro 'DEFINE_ncclDevFunc' 565 611 | : R5unW:orkB adtuce_TREE_SIMPLE_SumPostDiv_i32_2, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ note: ch, ProtoSimple<1, 1, 2>, 2>' requested hereoll, ty, redo p, 565algo | , pr oto, u n rrunTreeUpDown()r.runo(); t\ | o ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hS:670:15i: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), mple<1, 1, COLL_UNROLL>, COLL_UNROLL>(tid, nthrea/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hds, work); :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | t| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hi:432d:78: (note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here t432 | i dif ()tid ,< sub/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32_2, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tn) tiRdnIutnBnlhocWkr(oethrakdresCaod(Idxl.nx)l,t g().run(tid, subtn, wor tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ roup), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? nk);c | ^c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:l7:1: Snote: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here h7 | DmEFINeE_mncc.lDevFcunc(oAmm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stellRpeducSe_TREiE_SIzMPLeE_Sum_Post)Div_ i32_{2, n cclF uncA| llRe ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~duce , F unc| SumP group(groupost Div/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h, in:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested heret3 2_ t, NCC63 | PrimitivesL_A, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRingedo(p,i aldgo,, pr oton, utnrohll>().rrun()e; \a d| ^s /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h,:670:15 : work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tidi(tfid ), (nthtreaids(dnth rea().run(tid, su b/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32_2, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32_2, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_SumPostDiv_i32_2, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32_2, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32_2, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | In file included from Run/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(WorkBtatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthrd), enthreaads(ntdhreadss)(nthreads), tidInBlock(threadIdx.x, t)idIn,Block (threagdIdx.rx), group(grooupu), p| ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ (group | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ ) 671 | , | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' stepSize(stepSize_ == 0 ? ncclShmem.comm.buf670 | f tidS(tid)i, nthzreads(enthsreads),[ NCCL_PROTO_SIMPLEtidI]nBloc/k(thNreadICdxCL_STEPS/sizeof(T) : st.x), group(group), | ^~~~~~~~~~~ epSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32_2, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, wo, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreardk); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32_4, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direck(threadIdx.x), group(group), | ^~~~~~~~~~~ ty>, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here t=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32_4, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32_4, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32_2, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ le<1, 1, COLL_UNROLL>, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group 432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32_2, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PRO) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32_4, TO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32_4, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32_2, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32_2, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(thr:e670:15: warning: ainitializer order does not match the declaration order [-Wreorder-ctor] 670d | tIid(tidd), nthxreads.x)(nthre,a grouds),p t(gridInoup), | ^~~~~~~~~~~ Block(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32_4, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl()to, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32_4, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h.run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32_4, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32_4, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32_4, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(thr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.headIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(g:670:15: rwarning: initializer order does not match the declaration order [-Wreorder-ctor] o670 | utid(tipd), n)threa,ds(nth | ^~~~~~~~~~~ reads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | run/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nTreteUpDownh, ,COLL_ UNROLtL>(tiid, ntdhreadIs, wornk); B| ^ l/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:ock(th432:78: rnote: eain instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here d432Idx.x), group(group | ) if, (tid < su btn) | Ru ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ nWor| tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ kColl(().runT(tid,) subt n, wo:rk); | ^s /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:t17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFIeNE_nccplDeSvFize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5:O_ SIMnote: PLEin instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here, 4 ) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h565:611: | 62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | runTreeUpDown,O alLgo,L pr_otoU, uNnrROLL>, COLL_UNROLL>(tid, nthreads, worko)ll>;(). run ();| \ ^ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' : 670432 | : 78ti:d(tid), nthreads(nthreads), tidInBlock(threadIdx. note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:17::1 note: :field 'group' will be initialized after field 'stepSize' note: 670 | in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here tid (tid),17 nt | hrDeaEds(nFthrIeadNs),E ti_dInnBlocck(cthrleadDIdxe.x)v, :Fg670:ur15:no warning: cuinitializer order does not match the declaration order [-Wreorder-ctor] (p A(670gl | lr oR uteipdd()uti,cd) e, n_t| hT ^~~~~~~~~~~R reEE_SIMPLE_SumPostDiv_i3ads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(step2_S4, incclzFunecAl_lRe duc=e, =Fun cSum0Pos tDi?v, i nt3n2_tc, NcCCLl_ALSGhmeOm_TR.comm.buffSizes[NCCL_PROTO_SIMPLEEE,] NC/CL_NPROCTO_CSIMPLLE,_ 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch: s,tep Sizae_)l { g | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ o | group(group, /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h :254:90: pnote: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here r254ot | o , unroll>().run(); \ Primitives, /*Direct=*/0, Proto, 0> prims : 15:| note: field 'nthreads' will be initialized after field 'tidInBlock' ^ 670 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h tid(:tid565), :nth5rea:ds( nthnote: readin instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested heres), ti dInBl565oc | k(t hrea dId x.x ), rgruoupn(grToup), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreadreseU)pDo,wn< T, tRediOp,d PrIotoSnimpBle<1l, 1o, CcOLLk_UN(ROLLt>, hCOLrL_UeNadIdx.x), group(gROLL>(tid, nthreadrso,u pw)o,r k )| ; ^~~~~~~~~~~ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32_4, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32_4, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h tid(tid), nthreads(nthread:670:15:s warning: initializer order does not match the declaration order [-Wreorder-ctor] )670 | , tid (tid),t ntidInBlock(threadIdx.x), grouphreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | s(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32_4, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32_4, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32_4, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32_4, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(thread/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, workIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ ==); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32_4, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 0 ? ncclIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tiShmdem.comm.bu)ffSizes[N,CCL_PROTO_ SIMPLE]/NnCCL_STEPS/tsizeof(T)h rea: stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> primds(nthsreads), wid(tid%W ARP_SIZE)| , warp(tid ^/WARP_SIZ E), | ~~~~~~~~~~~~~~~~~~/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInB:lock(thre558adIdx.x/:WARP_SIZE5), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here | warp(tid/WARP_SIZE 498 | flagThread((tid%4)/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunW, NCCL_MAX_DEV_ARITY>, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32_4, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), orkCol | l stepS().run(tiof(uidnt64_t),) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hs:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0ub> prtn,i workm); s| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp | ^ :22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32_4, ncclFunc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062A:5: lnote: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here l1062Re | d urunRcing(3tid, 2nth_ret, NCCL_ALGO_RINGa,ds, workN); C | ^ C/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432L:_PROTO_SIMPLE, 4)78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBl>().orun(ctid,k sub(tn, twork); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpph:10:r1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested heree a10 | DEdFINE_InccldDevFxunc(.AlxlRed)uce_,RING _LL1g28_SurmPosotDivu_i32p_2, (ncclgFunroucAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_Pp),R | O ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hT:670:O60: note: _field 'group' will be initialized after field 'stepSize' L670 | L 1 tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 28, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32_4, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32_4, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32_2, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32_4, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, wo:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.commrk); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here .buffS 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32_4, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ izes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested hererunTreeUpDown, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32_4, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ RedOp, ProtoSimple<1, 1, COLL_UNROLL>, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32_4, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32_4, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32_4, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(thre if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32_4, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ adIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32_4, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32_4, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx908. 21 warnings generated when compiling for gfx942. 21 warnings generated when compiling for gfx90a. [ 67%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint3In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 2_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdxIn file included from .x/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | bar/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75rier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threa:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ dIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t dataIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx1, flag1, data2, flag2; | ^~~~~ In file included from .x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); :| 174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145: ^~~~~~~~~~~~~~~~~~14: warning: unused variable 'data1' [-Wunused-variable] 145 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h uint32_:t dat29a1, f:lag1, 15data2,: flag2 ; | ^~~~~ note: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21:expanded from macro 'barrier_by_group' warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t 29data | const int w = threadIdx.x/WARP_SIZE; \ 1| , fla ^g1, data2,In file included from flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint3In file included from 2_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28In file included from : warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp: warning: unused variable 'w' [-Wunused-variable] :75 | 2 ba: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] rrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = thr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: eadIdx.x/WARP_SIZE; \ | ^ warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t:218 :15: warning: dunused variable 'bid' [-Wunused-variable] 218a | t coIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_groupnast int(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ bid1 = n,cclS hmemIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hf.:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ lag1, data2, flag2; c hannelId | - wo ^~~~~rk-> chan/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.hnelLo; | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] :145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hIn file included from :366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | c/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | coonst int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | nst int w = threadId145x | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ .x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h barrier:218:_15: warning: bunused variable 'bid' [-Wunused-variable] y218 | _ cognst rint obid u= ncpclS(hmem).cha;nnel Id - wor| k->c ^~~~~~~~~~~~~~~~~~hann elLo/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = In file included from threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2:218:: 15: warning: In file included from unused variable 'bid' [-Wunused-variable] /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h218 | : co11nst int bi: d = In file included from nccl/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hShme:m.c:174h366:15: a: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.hwarning: unused variable 'bid' [-Wunused-variable]n: n 145366 | e: 14 con:lst Iinwarning: td bunused variable 'data1' [-Wunused-variable]i d =- n c145 | uint32_t dawork->channelLo; | ^~~ clShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ ta1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t da/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ ta1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ , flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - worIn file included from k->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15 | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h::29:15: note: expanded from macro 'barrier_by_group' 29 | warning: const int w = threadIdx.x/WARP_SIZE; \ | ^ unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ : /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | cIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.honst int bid = ncc:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ lShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_2, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_2, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_i64_2, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreIn file included from eSplit(tid, nthrea, dtidInBlsock(threa,dIdx .x), gwroup(groouprk);), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work);| tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671oSimple<1, 1, COLL_UNROLL | stepS>, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_2, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(groize(ste| pSiz ^e_ == 0 ? ncc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpplShmem.comm.b:uffSi5zes[N:CCL_P1ROTO_:SIMPL E]/NCnote: CL_Sin instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested hereTEPS/ size of(T) : st5epSup), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ i | ze_D) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group E/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: Fin instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here gIr254oupN) | , E | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671_ | st epnSi zec(sPtecpSrizle_i =D= m0 ?e inccvFunc(Altilves, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested hereostD iv, anAsiym303mne | trit cC,i /C*DmiLreic_t=t*A/0iL, PrGotovO, 0e_> psTrim, ProtoSimple<1, 1, 2>, 2>' requested here d565 | ON prCunTCreeL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611UpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_2, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_2, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreadsoll, ty, redop, algo, proto, unroll>().run(); \ | ^ ), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_i64_2, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_2, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreadsizes)[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree-In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_2, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ >down, tree->down, work->sendbuff, work->recvbuff, work->redO, tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_2, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ pArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_i64_2, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_i64_2, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_2, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | [NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, wRounWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ rk->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_i64_2, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_2, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_2, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ T, RedOp, Algo, Proto, COLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.he_TREE_S:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_2, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ IMPLE_SumPostDiv_i64_2, ncclFuncAllReduce, FuncSu/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), ntmPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(hreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64_2, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().r,un(tid , subgtn, wrork);o | ^ u/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cppp:7:1(: note: grin instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here o up), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | 7 tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ | DEF 671 | stepINE_nScclDeviFunc(AzllRedeuce_TREE_SIMPL(E_SusmPtosteDiv_ip64S_2i, nze_ == 0 cclFu?ncA lncclReduce, FuncSumPostDiv, int64_t, NCCL_ALlShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | PriGO_TRmEE, iNCCL_PROTOt_SIMiPLE, v2) | e^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' s 611 | _, aDlgoE, pVrot_o, uAnroRll>I().Trun(Y); >\ ,| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/:*670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tidD(iretcti=*d/0,), nthreads (Pronto, t0> hprireads), tidInBms | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, ind(ttidh), rnthereaadsd(ntshr,ea dws),o tidInBlorck(kthre); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | adIdx.x), group(group), | ^~~~~~~~~~~ if (tid < subtn) RunWorkColl, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl()o, Proto, COLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_2, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_.run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_2, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_2, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_2, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64_2, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_2, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid/WARP_SIZE), tid(tid| ), nthreads(nthreads), tidInBlock(thre ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~adId x.x), g roup(grou| p), | warp(tid/WARP_SIZE ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof( 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~T) : stepSiz e_) { | | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group group(group/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h | Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | , NCCL_MAX_ DEV_ARITY>, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpPrimitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: Dowin instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested heren, CO LL_UN ROLL> (tid, inthrefads, work)(; | ^t /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hi:d 432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64_2, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Op, Algo, Proto, COLL< subtn_) RUunNWorRkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10OLL | >().Drun(tEid, FsubtINE_n,n workc); c | l ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1D: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested heree vF 7un | c(AllReduce_RING_LL128_SumPostDiv_i64_2, ncclFunDEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPocAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ stDiv_i64_2, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] , NCCL_PROT O670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_4, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ _SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64_2, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_SumPostDiv_i64_2, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL12/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group)8, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | , ^ | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64_2, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64_2, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64_2, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ lock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_R:670:I15: warning: initializer order does not match the declaration order [-Wreorder-ctor] N670 | Gtid(tid_), nthrSeads(nthIreads),M tidInBlPock(thrLeadIdx.Ex), grou_p(groupS), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ u | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671m | stePpSize(sotepSize_s == 0 ?t ncclSDhmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STiv_i64_2, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatcEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_4, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ h, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64_2, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_2, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ roll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_4, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subt/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) Rn) RunWorkColl()unWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64_2, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ .run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_4, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_4, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_4, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? n/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | cclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_4, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Di=rect=*/0, Proto, 00> prims | ^ ?/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | n runTcreeUpDowcn, COLL_UNROLL>(tid, nthreads, work); | ^ROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, 0, 2, 4>::run' requested here _432 | M if (tAid < sXubtn) _RunWorDkColl().rYun(tid,, subtn , work1); | ^>, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:56517:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:Su78mPo:stD iv_inote: 64_4in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here, n cclF uncAllRe432duce | , Fun cSum Post Div, int6 4_t, NCCiL_AfLGO_ TREE(, NCtCL_PROTO_SIMPiLE, d4) | ^ , algo, proto, unroll>lgo, Proto, COLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_4, ncclF().run();u \ n | ^c A/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:l670:15l: note: field 'nthreads' will be initialized after field 'tidInBlock'R e670d | u tcid(etid,), nthFreauds(nnthrceadSs),u timdInPBloock(sthrteadDIdxi.x),v gr,oup (grioupn), t| ^~~~~~~~~~~~~~~~~ 6/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60:4 note: field 'group' will be initialized after field 'stepSize'_ t670 | , tiNd(tid), nthreads(nthreads), tidInBlock(threadIdx.CCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().runx), gr(ou)p(;gr ou\p) , | ^~~~~~~~~~~| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_4, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_4, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 1, COLL_UNROLL>, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_4, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64_4, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | P/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.cormimitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_2, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ m.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBloc(tikd < su(btn) RtunWorkhColl(x).run(.tid, sxubtn), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | st, worek); p| ^ S/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:17:1i: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here z17 | DEFINEe_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_4, ncc(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ lFunc AllRe| duce, group(groupFuncS umP/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hostDiv, int64:_t, N303CCL_A:LGO_T90RE: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670ITY>, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_4, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_4, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64_4, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_4, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_4, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_4, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64_4, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64_4, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64_4, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_4, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64_4, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64_2, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:22:1:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64_4, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64_4, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_4, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64_4, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevF/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64_4, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670unc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_4, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64_4, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64_4, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1102. 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx942. [ 68%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, dat/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.ca2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ hannelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable]In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174In file included from : /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, dat/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cppa2, fl:ag2; | 2 ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28:: warning: unused variable 'data2' [-Wunused-variable] 145 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | uinbt32_t daata1, flarg1, data2,r flag2; ier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ flag1, /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | constIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hIn file included from :218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelI consdt int w = thre-adIdx.x /WA/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cppRP_SwI:ZE; o\ 2 | ^ r: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | conk->chasnnelLot; | ^~~ int bid =:366:15: warning: unused variable 'bid' [-Wunused-variable] ncclShme366m.chann | elId - work->c hanne lLo; | ^~~ const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ :218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ 2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.chanIn file included from nelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8_2, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8_2, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8_2, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8_2, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8_2, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8_2, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8_2, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 | ? flagThr ead((tid%4n)==3), grcoup(groupc), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~l | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | S stepSihze(ncclShmem.comm.bumffSizes[NCCLe_PROTO_LmL128]/NCCL._STEPS/comm.buffSizes[NCCL_PRsizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | OTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitivesdo8Y_2, ncclFuncAllReduce, FuncSumPostDiv, int8_t, wn, tree->down, wor,k-NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ >sen dbuff,1 work->>recvbu,ff, work ->redOpA/rg); | * ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:D1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here irect=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h 1070 | runTreeSplit(tid, nthre:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nads, tworhk); r| ^ e/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:a78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested hered 432 | s , if ( tid < wsubotn) RrunWork); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tidk Coll<( ).rRunWoun(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:5:1: rkColnote: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_i8_2, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ l().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8_2, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8_2, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_i8_2, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_i8_2, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8_2, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_i8_2, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8_2, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8_2, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_i8_2, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_i8_2, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8_2, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclSShIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8_4, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ mem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hIn file included from :432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINhreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ E_ncclD671evFunc | (All Reduc e_TRE E_SI MPLE_sSumPotstDive_i8_pSize(step2S, nccilFunczAle_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(lReduce, FuncSumPostDiv, int8_t, T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0 ,Run WorkPBatrch prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here y >, alg565o, | p rot o, unro ll>r().urunn();T \ r | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | eeUpDown, COLL_UtidN(RtiOd)L, nLthre>ad(s(nthreadts),i tiddInB,lock (tnhreatdIdhx.xr), egroaupds, work);(gr oup )| , ^| ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h::432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | 670 i:f60: note: (field 'group' will be initialized after field 'stepSize' t i670 | d t().run(tid, subtn, work); | ^gr ou/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cppp(group):, 7 | : ^~~~~~~~~~~ 1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8_2, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8_2, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8_2, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8_2, n/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | cclFuncAllReduce tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8_2, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15(:group), | ^~~~~~~~~~~ note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8_2, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8_4, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthrea d670 | tisd(tid),( nthreadsn(nthreadts), tidIhn 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8_4, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Block(trehreadIdx.x), gads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSizeroup(g(roup), s| ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ t671/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here | stepSize(stepeSize_ p== Si558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8_2, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ z0e ? nc_clShme m.== 0 ? ncomm.bcufclShmem.cfSizoes[NCCmm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { S/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives< | T, RedOp, F ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ a| group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hn:303:90A: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here s 303y | m Pmrimiteives, /*YDir>ect=*, /*Direct=*/0, /Proto0, 0> , Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, C | OruLL_UNROLnTLree>UpDo(wn, COrLL_UNkROLL>)(tid,; nth rea ds, wo| rk); ^ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h :/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h432:78::432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8_2, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE,n, T, RedOp, Algo , Proto, COLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8_2, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8_2, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hSIMPLE_SumPostDiv_i8_2, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PR:O670:15: warning: Tinitializer order does not match the declaration order [-Wreorder-ctor] 670 | O ti_d(tid)S, nthrIeads(nMthreadsP), tiLdInBlE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62:ock( threadnote: Idx.xexpanded from macro 'DEFINE_ncclDevFunc'), 611 | group( grRunWorkBatch | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ ,| tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | asteplSize(gstepSoize_ ,== prot o0 ?, unro nlcclShlmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCC>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), L_S TEPS/| size ^~~~~~~~~~~~~~~~~of(T) : st/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~: | group(group 670/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h::63:56: 60note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here :63 | Primnote: ifield 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreativeds,d 0, IProtno, 0B> prlimos | c ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hk(thr:558:5e: note: ain instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8_2, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x),/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nth rgroup(greoup), | a ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ d 671 | s stepSi,ze(stepS ize_ ==w 0 ? nocclShmemr.comm.bkuffSizes)[NCCL_PRO;TO_SIMP LE]/NCC L_STEPS| /sizeof ^(T) : /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8_4, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid,:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(All nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReductepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8_2, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ e_TREE_SIMPLE_SumPostDiv_i8_4, ncclFuncAllReduce, FuncSuReduce_TREE_SIMPLE_SumPostDiv_i8_4, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ mPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), ti:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : dInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8_2, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8_4, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8_2, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINeadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group E_n/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hcclDevFunc(AllReduce_RING_:LL128_63SumPos:tDiv56_i8_2:, note: ncin instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here clFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING,63 | NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' Primiti611ves< | T, R edOp, FanSy mmetr ic<1>R, 0, uProto,n 0> pWrims o | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hr:558k:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested hereB 558 | a rtunRingc(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tll, ty, redop, algo, proto, unroll>().run(); \ | ^ id < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8_2, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h note: field 'nthreads' will be initialized after field 'tidInBlock' :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buf 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threfaSizeds[NCCIL_PRdOTO_xSIMP.LE]/xN)CCL,_ST EgPS/srizeoof(uT)p : (stegpSize_)ro { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90up:), | note: ^~~~~~~~~~~ in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8_4, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8_4, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < s ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_ubtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_SumPostDiv_i8_2, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ OTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | r/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | unRi ng(tnid, ntthreadhs, workr); | ^e /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hads(nt:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl), | ( ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) 671 | . strepSizeu(stnepSiz(e_ =tid= 0, subtn, wor ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepk);S | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cppi:12z:1: note: ein instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12_ | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8_2, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING,) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ N| group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hC:63:56CL:_ note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here P63 | R POrimiTtivOes, ,0, P roto2, 0>) pri ms | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h: 558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid611 | , nthreads, work); | ^ RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(ti/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hd:)432:78:, note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432n | t ifh (tird < esubtan) RudnWors(nthreads), tidkCoIll().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:22: ^~~~~~~~~~~~~~~~~1 /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h::670 note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING:_60: note: Sfield 'group' will be initialized after field 'stepSize' I670 | M P tLid(Etid_), Snthureads(nthreads), tidInBlock(threadIdx.x), groumPopstDi(v_gi8r_4oup, )nc, | ^~~~~~~~~~~ clFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8_4, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8_4, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x),17 warnings generated when compiling for host. group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8_4, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8_4, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8_2, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8_4, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8_4, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8_4, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8_4, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclSh unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | mem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8_4, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(thread/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Idx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthread ts), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_id(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8_4, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8_4, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROT/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:of(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8_4, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlo15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidI:n670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8_4, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Block(threadIdx.xck(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8_4, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8_4, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8_4, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8_4, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffS0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:izes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8_4, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: 56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Prfield 'group' will be initialized after field 'stepSize'o 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ to, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().r/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hun(tid, subtn:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Pr, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8_4, ncclFuncAllReduimitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8_4, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(thread/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDowIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreand, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17s), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8_4, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8_4, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8_4, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1201. 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx942. [ 68%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:ag2; | ^~~~~ 2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flaIn file included from g2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp::2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h145:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h::175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5:28 warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint3 =2 thre_adIdxt.x/WA RP_SIZE; d\ | a ^ ta1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp: 2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h :27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const intu bid i= ncnclShmtem.ch3ann2e_ltI dd a-ta1, flag1, data2, flag2;In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] work80->cha | nnelL o; | ^~~ barri | ^~~~~e r_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE;/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp: \ | ^ 2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = nccIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ lShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = nc:c218:15: lwarning: unused variable 'bid' [-Wunused-variable] 218S | conhst int bid = nmcclShmeem.chmannelI.d - wcork->chhannelannelId - work->channelLo; L| ^~~ o; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | : 366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ P_SIZE; \ | ^ work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_2, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tIn file included from id(tid), nthreads(nthread/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpps), ti:dInBl2ock(threadIdx: .x), In file included from group(/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hg:r11: oupIn file included from )/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h, | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthrea:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:d670:s15: warning: initializer order does not match the declaration order [-Wreorder-ctor] (670 | ntid(tid)t, nhthreads(nrthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ ==ea ds), tidI0nBloc ? ncclShmem.comm.buffSizek(thrseadId[x.Nx), group(gCroupC), L | ^~~~~~~~~~~_ PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_2, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), In file included from | ^~~~~~~~~~~~~~~~~/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2 : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h::670:15: 670warning: initializer order does not match the declaration order [-Wreorder-ctor] :670 | 60 tid(:tid )note: ,field 'group' will be initialized after field 'stepSize' n t h670 | tid(tid), nthreads(nthreads), tidInBlocrkeads((nthretads),h tidIrnBloceak(thrdeadIdIx.x),d grouxp(gro.upx)),, group(g r| ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | o tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ up), 671 | | ^~~~~~~~~~~ stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColld), n(threads)(nthr.eads)r, tidun(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFIInNBlockE(thre_adIdxn.x),c grocup(grloup), D | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ e| tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_v 671 | F u stepnSizec(s(tAeplSlReduce_TREE_SIMPLE_izSe_ ==u 0 m? ncclShmem.commPostDiv_u32_2, ncclFuncAllReduce, FuncSumP.buffSizeos[NCsCL_PRtOTO_SDIMPLEi]/vNCCL,_ST Euint32_t, NCCL_ALGO_TREE, NCPS/siCzeof(LT) _: stePpSizeR_) { O | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ T | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hO:254_:90:S Inote: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested hereM P LE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611254 | | P rimit ives< T, RedROp, uFanWorkBatchnAs, aNCCLl_MAXg_DEoV_ARITY,, 1>, /*Dpriroectot,=*/0, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthrea Prodto, s0> p)rims, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.ht:565:5i: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested hered I565n | B l ruonTrceeUpDkown<(T, RtedOph, PrrotoSiemplea,60 COL:L_UN ROLLnote: >(tidfield 'group' will be initialized after field 'stepSize', nt hre ads,670 | wo r k tid(tid), nthreads(nthreads), ti); d | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hI:432n:78: note: Bin instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here l432 | if (tid < suock(threadIdx.x), group(group), | ^~~~~~~~~~~ btn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_2, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_2, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_2, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hnote: field 'group' will be initialized after field 'stepSize':670: 15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), gr 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group)oup(group), | ^~~~~~~~~~~ , | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_2, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ lgo, /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_2, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIProto, COLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_2, ncclFuncAldx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ lReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(tIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] hreadIdx.x), group(group), | ^~~~~~~~~~~ 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_2, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_u32_2, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_2, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ : warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(grouIn file included from p), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PRO/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid),TO_S IMPnLE]/NCCLt_STEPS/hsizeofr(T) : setepSize_a) {d | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | s group(group (/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: nnote: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitithreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadves,R /*DirecPt=*/0,_ Proto,S 0> primIs | ^ Z/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5:E note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here) , 565 | | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), grunrTreeUpoDown, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_u32_2, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ LL>, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_2, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | Op, ProtoLL128, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TRE runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_2, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ E_LL128_SumPostDiv_u32_2, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*D), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ?irect=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_2, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32_2, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nth/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u3reads(nthreads), tidInBlock(thr2_2, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), groeadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | up(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), grou: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ p(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32_2, ncclFuncAllReduce, FuncSumPostDiv, uint:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_2, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32_2, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ eads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthread/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.cos), mm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32_2, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeS/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_2, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ plit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_u32_2, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DIn file included from EFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_2, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBa/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBltcho, a(lgo, ptroto, uhnroll>r().ruen(); a\ | ^d /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hI:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock'd 670 | x t.id(tidx), nth/readsW(nthAreadsR), tiPdInBlock(th_reSaIdZEI), dx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->u ptid,(ti d), nthwreads(onthreadrs), tidInBlkock(-threa>dIdxs.x), groeup(gronup), d| ^~~~~~~~~~~ buff, work->recvbuff, work->re:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPdOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, wLoE]/NCrCL_kSTEPS/size)of(T); : ste pSiz e| _) { ^| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here :303 | 432 P:r78i:m itnote: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested herei ve s432< | T, if (tid < RedOsp, FuanAsybmmettric<1n, ) NCCL_MAX_DEV_ARITY>, /*Direct=*/0, Proto, RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_u32_2, ncclFuncAl0> lprimRs | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:e5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested hered 565 | u rcunTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) e, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch().rrun(etid, dsubtn,o workp); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:<1: note: ty>,in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7a | lDgo, proto, unroll>().run(); \ | ^EFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_2, ncclFuncAll Reduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h proto, unroll>().run():670:;15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670\ | ti d| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15:(tid), nthreads(nthreads), tidInBlock(threadId note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(ntx.x)h, grorup(egroaup), d | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ s| tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | ) s,tepSi ze(sttepSiize_ =d= 0I ? ncnclShmBem.comlm.bouffSiczes[NCkCL_PROTO_SI(MPtLhEreadIdx.x), grou]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254p(group), | ^~~~~~~~~~~ :90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_4, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | grou stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)p), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670: 60: note: field 'group' will be initialized after field 'stepSize' 497670 | | ti d(tid), nthre ads(n threa ds), twidInBalock(threadIdx.x), group(group), | ^~~~~~~~~~~ rpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_u32_2, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_4, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_2, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_2, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_4, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | | ^~~~~~~~~~~~~~~~~tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32_2, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_SumPostDiv_u32_2, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, w/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_4, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unork); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWoroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ rkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_4, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run();/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group),:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stegroup(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32_2, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_4, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32_2, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32_2, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_4, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_4 7 | DEFINE_ncclDevFunc(AllReduce_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hTREE_SIM:670:15: Pwarning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | L tiEd(tid),_ nthreaSds(nthrueadsm), PostDiv_u32_2, nc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/clFuncAllR0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_2, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ edutidInBlock(threadId, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ x.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatchfSiz,es[NCCL_PRO TO_SIaMPLE]/lgo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x),NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32_4, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_4, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_4, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_4, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_4, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32_4, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_nccl, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_4, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ DevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_4, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSi:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] ze(stepSize_ == 0 ? ncclShmem.comm.buffSizes 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32_4, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto 671, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadId | stepSizex.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (stepSiz[NCCeL_PROTO_SIMPLE_]/NCCL_S TEPS/size=of(T) : =stepSize _) { | 0 ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h?:63:56 ncclShmem.comm.buffSizes[:N note: Cin instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here C63 | L Pri_mitivPes,_S I0M, PProto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558LE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ | runRin/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hg(tid, nthnote: readsin instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here, wo rk); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 558432 | | if (tid < s ubtn) RunWorrkColul().run(tid, subtto, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tin, wdork) ; | ^< /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp :22:1s: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested hereu 22 | DEbFINE_tncclnDevFun)c(All ReducRe_RINuGnWo_SIMPLrEk_Colluint32(_)t.,r uNCn(tCid, subL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) tn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32_4, ncclFuncAllReduce, FuncSumPostDiv| ,^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h: 611:62: note: uexpanded from macro 'DEFINE_ncclDevFunc' 611i | nRunWotrk3Batch2, ,algo, protoN, unrCollC>().rLun()_; \A | ^ L/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:G15: note: field 'nthreads' will be initialized after field 'tidInBlock'O 670 | _ Rtid(tIid), NnthreGads(,nthre adsN)C, CLt_idPIRnOBlock(threadIdx.x), group(grouTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthrp)e, | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.ha:670:60d: note: field 'group' will be initialized after field 'stepSize' s670 | ( tidn(tid)t, nthrheadrs(nthereads), tidInBalockd(thresadIdx).x), ,gro up(grotup), i | ^~~~~~~~~~~ dInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_SumPostDiv_u32_2, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32_2, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_4, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32_2, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_4, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_4, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_4, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h17 warnings generated when compiling for host. :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32_4, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_4, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32_4, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32_4, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS//builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32_4, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ symmetric, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_4, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_4, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32_4, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32_4, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32_4, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx908. 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx942. [ 68%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h | co:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ const int bid = ncclShmem.channelId - work->channelLo; | ^~~ nst int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ :366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ p, FanAsymmetric, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_4, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64_2, ncclFIn file included from uncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(t(id), nthreads(ntthreads), tidIniBlock(thdread)Idx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | , nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? nc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | r u nPrTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ imitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_4, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15:), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_4, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_4, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_4, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_4, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' :670:15 670 | : warning: initializer order does not match the declaration order [-Wreorder-ctor] tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_4, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_4, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buf/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_4, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PRfSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ OTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, su b670t | n , w otrikd)(;t i d| ) ^, nthread/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpps:(17n:t1h:r enote: ain instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested hered s), tidIn B17l | oDcEkF(ItNhEr_enacdcIldDxe.vxF)u,n cg(rAolulpR(egdruocuep_)T,R E E| _ ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~S I M| P tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_L E_SumPos t671D | i v _ u 6s4t_e4p,S inzcec(lsFtuenpcSAilzleR_e d=u=c e0, ?F unncccSluSmhPmoesmt.Dciovm,m .ubiunftf6S4i_zte,s [NNCCCCLL__APLRGOOT_OT_RSEIEM,P LNEC]C/LN_CPCRLO_TSOT_ESPISM/PsLiEz,e o4f)( T )| ^: stepS/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hi:z611e:_62): {note: expanded from macro 'DEFINE_ncclDevFunc' | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group 611 | RunWorkBatch/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h<:c63o:l56l:, note: tin instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested herey , re d63o | p < t y >P,r iamligtoi,v epsr().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Op, FanSymmetric<1>, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64_4, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(ti/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hd%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkCo/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWll().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ orkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_4, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_4, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64_4, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64_4, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_4, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSiz:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64_4, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64_4, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64_4, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_4, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_4, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_4, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(thr17 warnings generated when compiling for host. eadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_4, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidIn, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Block(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64_2, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64_4, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_4, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_4, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_4, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_4, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64_4, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthrea/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64_4, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ds(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64_4, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1200. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64_4, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64_4, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx1201. 21 warnings generated when compiling for gfx942. 21 warnings generated when compiling for gfx90a. [ 68%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:: 11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hIn file included from :175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:5: :warning: unused variable 'w' [-Wunused-variable] 8011 | bar: rieIn file included from r_by_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hgroup():; 173 | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:: 29:15: note: expanded from macro 'barrier_by_group'/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h 29 | : 75 con:st i7nt w := threadIdx. warning: unused variable 'w' [-Wunused-variable] 75 | barriex/WARP_SIZE; \ | ^ r_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, In file included from data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp::2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:2111: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h::75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group( warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ); | ^~~~~ ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h: 29:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h15: note: expanded from macro 'barrier_by_group' 29: | const int w = 145threadI:dx.x/WAR35P_:SI ZE; \ | ^warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARPIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27_SI | ZE; \ | ^ const int bid = ncclShmem.channelId In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ :218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channeIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' l29Id - work->channelLo; | | ^~~ const int w = thread/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hIdx.x/WARP_SIZE; \ | ^ In file included from :218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrieIn file included from r_by_gro/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: uIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | p uint32_t data1, f(lag1, d); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:ata2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h15: note: expanded from macro 'barrier_by_group' 29 | :145:21 : warning: unused variable 'flag1' [-Wunused-variable] 145 | c uoinnstt int w = 32_t dtata1, hrfeladIdx.x/WARag1P, da_SIta2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | ZE; \ | ^ uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2g: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11r: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.ho:175: u/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5p: warning: unused variable 'w' [-Wunused-variable] (80 | ) bar;rier_ by_gr oup(| ); | ^~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15:15 note: expanded from macro 'barrier_by_group' : 29 | conote: nexpanded from macro 'barrier_by_group' 29 | const int st int ww = th rea=dI dx.x/tWAhRrPe_aSdIZIEd; x.x/WARP_SIZE; \ | ^ \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] In file included from 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data uint32_t data1, flag1, data2, flag2; 1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:212: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h::27:15: warning: unused variable 'bid' [-Wunused-variable] warning: 27 | unused variable 'flag1' [-Wunused-variable] con st i145 | uint3nt bid2 = nc_clSt hmdeamtIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ a.channelId - work->chann1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ elLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmemIn file included from .channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from :/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h218:80:5: warning: :unused variable 'w' [-Wunused-variable] 1580 | : warning: unused variable 'bid' [-Wunused-variable] 218 | const ba rrier_by_grouipnt bid =(); | ^~~~~~~~~~~~~~~~~~n /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const intcclShmem.channelId - work->channelLo; | ^~~ w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h27 | :366 :15: warning: unused variable 'bid' [-Wunused-variable] const366 | conint bst iintd = nccblid = SncchlSmhemm.emchannelId - work->cha.nchannneelId l- workL-o>;c | ^~~ hannelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h const int w = threadIdx.x/WARP_SIZE; \ | ^ :218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h: 27:15: cwarning: unused variable 'bid' [-Wunused-variable] 27o | n consts int btid = ncclShmem. channint bielIdd - w =or kn-c>clchanSnhelmLoem; . channelId - work->ch| ^~~ annelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145In file included from :28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ :366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ id = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8_2, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8_2, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8_2, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8_2, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatctidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { h, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8_2, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_u8_2, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFI/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:N2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hE:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h_:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498n:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | c tcid(tidl), nDthreaeds(vnthrFeads)u, wnid(tidc%WARP(_SIZEA), warlp(tidl/WRAeRduce_TREE_SIMPLE_SumPP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | ostDiv_u8_2, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | flaRgThreaud((tind%4)=W=3), ogroupr(groukp), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ B | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | a stetpSizec(ncclShhmem., alg128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here o, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 461 | 670 p | rims (tid, nthre adsSp lit, ttree->idown,d &tree->up,( wotrk->siendbudff, w)ork->r,ecvbu ff, wonrk->rtedOpAhrg, reads(nthread0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work);/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 | ? ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | nDEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_u8_2, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:cclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ *Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8_2, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | :29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_u8_2, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_u8_2, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8_2, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Di/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_u8_2, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ rect=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, CO 670 | L tid(tLid), n_threadsU(nthreadNs), tidIRnBlock(tOhreadIdLx.x), gLroup(g>rou(p), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~t | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ i671 | d ste,pSize(s tepSizen_ =threads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78= 0 ? nc:clShm em.comm.buffSizes[NCCL_PROTO_SIMPLE]/Nnote: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevCCFL_STEPuS/sizeofn(T) : cstepSi(ze_) A{ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ l | group(group l/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | R Priemitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5:IMPLE_SumPostDiv_u8_2, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALG Onote: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here _565 | T runTreeUpDownL, _CPORLOLT_UON_RSIOLMLP>LE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8_2, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8_2, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_u8_2, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u8_2, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8_2, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8_2, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8_2, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u8_2, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8_2, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ IMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u8_2, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) {/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h | :670: ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | | tid group(group(tid) , nthreads(nthreads), tidInBlock(threadIdx.x), g/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hro:u303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | p(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u8_2, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8_2, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u8_2, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8_4, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nt/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hhreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8_2, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPost/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hDiv_u8_4, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PR/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hOTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, u:670:15: nwarning: initializer order does not match the declaration order [-Wreorder-ctor] r670 | tiod(tid)l, nthrlead>s(nthreads), tidInBloc:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | () ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~.run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock'| 670 | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ tid(tid), nt hreads( nthreads), ti671dInBlo | ck(threadk(thIre adIddx .x),x gro. up(grxsoup), )t | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | e, tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671p | gSsteirpSiozuez(steppSeize((stegproup_S ==) i0 ,? ncc lS hme| m.com ^~~~~~~~~~~~~~~~~m.bzue_ == /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:6700:60:f f Sinote: ze?s[field 'group' will be initialized after field 'stepSize'NC C nL c_c670PR | lS Oh T mO_e tSmIi.comm.bud(tid), nthreads(nthreads)MPLE],/NCCL _STEPtS/sizieof(Td) : stIepSizneB_lo) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303: Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8_2, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 90:ffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here V303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8_2, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ _ARITY, 1>, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tidIn file included from , /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cppn:2: tIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hr:670:15e: warning: initializer order does not match the declaration order [-Wreorder-ctor]a d670 | s , w toirdk(t)i;d | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h), nthrea:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | ds(nthreads), tidInBlock(threadIdx.x), group(group) if (tid < subtn) RunWorkColl().run(tid, subt, | n ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | , tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepwSize(osteprSizek_ ==) 0 ?; ncc lShmem. comm| ^.b /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here uffSizes[17NC | CL_PDEFINE_ncclDevFunc(AllReduce_TREE_SIMPLER_OTO_SSIMPuLE]/NmCCL_SPTEPS/sizeof(To) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, t/*Dircecth=*/<0, Pcrotoo, 0>l prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hl:565,:5 : note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested heret 565y | ,run redop, algo, proto, unTrreeUpDown, COLL_UNROollL>().Lrun(>); \ ( | ^t /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:i670:15d: ,note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_)n, tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ cclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8_2, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] | RunWor 670 | tid(tid), nthreads(nthrkBatch, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work):; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlockLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8_2, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ note: field 'group' will be initialized after field 'stepSize' 670 | ds(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? n/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x)cclShmem.comm.buffSizes[NCCL _ tiPd(tidR), nOtThrOea_ds(ntShreaIds), MtidInBlock(PthLE]re/NCCL_STEPS/sadiIdx.zx), egrouop(group),f (T) : ste| ^~~~~~~~~~~ pSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpD, group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8_4, ncclFuncAllReduce, FuncSowumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ n, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8_4, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_SumPostDiv_u8_2, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8_4, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8_4, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(ti/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? d, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8_4, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> primsTREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | t runRiing(t)id, nth,reads, work)n; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.ht:432:78h: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here re432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u8_2, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclS 611 | hmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u8_4, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PR In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NC RunWorkBads(nthreads), tidInBlock(threadIdx.x), CL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u8_2, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hthreadIdx.x), OTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ group(group), | ^~~~~~~~~~~ atch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670::60670:15:: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nth note: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hreads(nthreads), tidInBlockfield 'group' will be initialized after field 'stepSize' ( 670 | t h r tide(taidd), Intdhrxead.s(ntxhr)e,ads ), tgidroInuBplo(gck(rtohup), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | r ea:sdI670tdxe:.15px):S, igrwarning: zoinitializer order does not match the declaration order [-Wreorder-ctor]eup ((g sroup),t 670e| ^~~~~~~~~~~ | p Size_ = = ti0d (t? idnc)c, lntShmem.comm.bhreads(nthreaduffSizes[NCCL_PROTO_SIMPLE]/NCs)C, tLidI_nBlSockT(thEreaPdSIdx/.x)s, girouzp(egrooup)f, | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ ( T| ) tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~671 | s| tep group(groupSiz e(s/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.htepSize:_ 63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0C>CL _STpEPSr/sizieofm(Ts) : s| te ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads,pSi zew_) o{ r| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~k )| group(group ;/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303 :90 : note: | in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here ^303 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h P:r432i:mi78tiv:es , 1, 2, 2>::run' requested hereFanA sy mmet432ric<1, | N CC L_M AX_ DE if (tid < subtn) V_RARIuTYn>, W/*Doirrect=k*/0C, Porotlo, l0> , ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUOLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SpuDowmn, CnOLLc_UNcROLlL>(Ftidu, nncthArealdls,R weorkd); u| ^c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.he:,432: 78F: unote: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here n 432 | c S uif (mtidP < subtn)o RusnWotrkCDollir().erund(toidp, surk),; | ^ a/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:l7:1:g note: oin instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here, 7 | DpEFrINEo_tnccloDe,vFun c(AullnRerdoll>u(ce)_TR.EEr_uSIn(M)PLE; _\Su m P| o ^s /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tD iv _u8_ 2, nc clFtunicAld(lRtiedudce),, Funtnhreads(nthreadcsSum)Pos,tDi v, tuint8_ti, NdCCILn_BAlLoGOck(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads_(TREnE, tNCChL_PRrOTOe_SIaMPLdE, s2) ) | ,^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h :611t:62:i note: expanded from macro 'DEFINE_ncclDevFunc' d 611I | n RuBnWolrkBoatcch, aalgdo, Iprodto,x u.xnr)ol,l>( ).rgunr(o)u;p (g\ r oup), | ^~~~~~~~~~~ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8_4, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_SumPostDiv_u8_2, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u8_2, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDev 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u8_4, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | AllReduce_RING_SIMPLE_S RunWoumPosrkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tDiv_u8_4, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u8_2, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PRO/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8_4, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ TO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthirf (tied < saubtn) dRunWorskColl<)Fn, T, ,RedOp, Algto, Piroto, COLL_UNROLdL>().rIun(tid,n subtnB, workl); | ^o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cppc:17:1: knote: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17( | DEFItNhreadIdxE._nccxlDe)vFun,c (group(group), AllReduce _TREE_| SIMPLE_SumPostD ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PRO/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hTO_SIMPLE:670]:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] / 670 | i Nv_u8_4C , ncc ClFunc LAllRed_tuce, SiFuncSuTdmPostE(Div, PuinSt8_t,t/ NCCLi_ALGsdO_TREEi, NCCzL_PR)OeTO_SI,MoPLE f, 4()Tn) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:t254hreads:(n90thr:eads), tidInnote: Blockin instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here(thr eadId x | ^. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:254x611:62 | :) , note: expanded from macro 'DEFINE_ncclDevFunc' 611 | g Run WrorkB atoch T,, | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | s algo, proto, RedOp, FanAsymmetric, /*Direct=*/0, Proto, 0> pruniroll>()m.run()s; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:| 15: note: ^field 'nthreads' will be initialized after field 'tidInBlock' 670 | ti/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hd(tid), nthreads(tepSinze:(ts565tehpS:izre_ 5== e0 :? ncac lShmednote: m.commin instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested heres.buf)fSi,zes[NC C Lt_ PiROTO_Sd565IMPL | E]/NCC IL n_ BS lroTcEuknP(TtSr/ehesizUreepDown, C note: Ofield 'group' will be initialized after field 'stepSize' L670 | L ti_d(tUid), nthrNeadsR(:63:nO56: Ltnote: hin instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here r63 | e Praidmistives(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: Iin instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested herenBlo ck (threadI432dx | .x), group(g Symr meto ricu <1> p, 0i),, Prf oto | ,( ^~~~~~~~~~~ 0>t idprim s < | subtn) RunWorkColl().run(tid, sub ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.ht:558:5: nnote: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here ,558 | w ruonRinrg(ti ^d, n thr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cppeads, work:)17; | ^: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h1:432::78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested herenote: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | D432 | if (tid < subEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDitvn) _RunWuorkC8oll<_Fn, 4T, R,edOp , Alngo, Pcrotoc, COlLLF_uUNncRAlOlRLLed>u(c).e, ruFnu(nticSd,u msPuosbttnD, wiovrk,); u i | ^n /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cppt8_t:,12 NC:1C: L_note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here ALGO_TREE, NCCL_ P12 | RDEFIONE_TncclODevF_uncS(IMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | AllReduce_RING_SIMPLE_SumPostDiv_u8_2, ncclF RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tiuncAdllRe)duce,, Fun cSumnPosttDihv,r uinet8_ta, NCdCL_AsLG(O_RInNGt, NChCL_PrROTOe_SIMaPLE, d2) s | ^ )/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611,:62: note: expanded from macro 'DEFINE_ncclDevFunc' t611 | i RdunIWorkBatchn, algo, proto, unroll>().run(); \ | ^ p), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthrea/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:d670:15:s note: )field 'nthreads' will be initialized after field 'tidInBlock' , 670 | t tidi(tidd), nInBlock(tthreadsh(nthrreades), taidIndBlocIk(thdrexa.dx), group(group), | ^~~~~~~~~~~ Idx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u8_4, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ?/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8_4, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Prot 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u8_4, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ o, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8_4, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8_4, ncclFuncA/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) llReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8_4, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8_4, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15::670 :15: warning: initializer order does not match the declaration order [-Wreorder-ctor] note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(t670 | tid(tid), inthdr), ntheardesads(n(nththreads), tidInBlock(threadIdx.x), group(groureads), tidpInBlock)(thread,Idx.x) , group(group), | ^~~~~~~~~~~~~~~~~| /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~670 | | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ tid(tid), nthreads(nthreads), tidInBlock(thr e671 | a stepSdize(stIepSize_d == 0 x? ncc.lShmemx.comm.bu)ffSize,s[N group(group), | ^~~~~~~~~~~ CCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8_4, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl(/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h).:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] r670 | tiud(tid), nthreads(nthrenad(st)i,d ,t siduIbntBnl, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here ock(thread17Idx.x), g | roup(groDup), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ EFI| tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ NE_n671 | c c lDevF usntecp(AllReduce_TRESize(stepSize_ == 0 ? ncclShmem.comm.bE_SIMPLE_SumPostDiv_u8_4, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PuffRSizes[NOCCL_PROTTO_SIMPLOE]/NCC_L_STEPSS/sIizeof(TM) : stepPSize_)L { E| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group ,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h :463): 56 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here : 611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 63 | Prim611itiv | e RunWorkBatcs, ty, 0, rPreodop prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558>, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads( | runRing(teid,a nthrdeadss), ,w otidInBlrok); c| ^ k(threadIdx./builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:x432:78: note: )in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432, | group(group), | ^~~~~~~~~~~~~~~~~ if (tid/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h < subtn) RunWor:kC670:60: ollnote: ().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u8_4, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8_4, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u8_4, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8_4, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | t/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | id(tid), nthreads(nth tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8_4, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: reads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threexpanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthradIdx.x), group(group), | ^~~~~~~~~~~ eads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u8_4, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u8_4, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u8_4, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u8_4, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx906. 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx942. [ 69%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/alltoall_pivot_sum_i8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/alltoall_pivot_sum_i8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/alltoall_pivot_sum_i8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/alltoall_pivot_sum_i8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_grIn file included from oup/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10(: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h):145:14: warning: unused variable 'data1' [-Wunused-variable] ; 145 | ui nt32_t d ata1, fla| g1, dat ^~~~~~~~~~~~~~~~~~a2, fla g2; /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h| ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: :unused variable 'flag1' [-Wunused-variable] 29:15: 145 | uint32_t data1, fnote: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from lag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable]In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:37:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 37 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:82:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 82 | runRing(tid, nThreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_i8_2, ncclFuncAl/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:37:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 37 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:82:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 82 | runRing(tid, nThreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_i8_2, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ lToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:37:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 37 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:82:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 82 | runRing(tid, nThreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_i8_2, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:37:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 37 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:82:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 82 | runRing(tid, nThreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_i8_2, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:37:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 37 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:82:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 82 | runRing(tid, nThreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:4:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 4 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_i8_4, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:37:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 37 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:82:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 82 | runRing(tid, nThreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:4:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 4 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_i8_4, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:37:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 37 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:82:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 82 | runRing(tid, nThreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:4:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 4 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_i8_4, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:37:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 37 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:82:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here In file included from 82 | r/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: uinitializer order does not match the declaration order [-Wreorder-ctor] nRing(tds(nthreads), tidInBlock(thrIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:37:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 37 | Primitives, 0, Proto, 0> prims | ^ eaid, nThreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:82:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 82 | runRing(tid, nThreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_i8_2, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 432 | if (tid < subtn) RunWorkCollzes[N(CCL_PR)OTO_S.IMPrLuEn]/(NtCiCdL,_S subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:3:1:TEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_i8_2, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 37:256: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here )37 | Pri miti| ves:, 0, 611Proto,: 0>62 prim:s | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:82:note: 5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested hereexpanded from macro 'DEFINE_ncclDevFunc' 82 | run Ring (tRid, nTuhnreads, work); | ^ WorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: 60in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | : if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(AllToAllPivot_RIN note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ G_SIMPLE_Sum_i8_2, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:37:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 37 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:82:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 82 | runRing(tid, nThreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_i8_2, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:37:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 37 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:82:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 82 | runRing(tid, nThreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:4:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 4 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_i8_4, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:37:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 37 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:82:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 82 | runRing(tid, nThreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_i8_2, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:37:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 37 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPrimitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:82:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 82 | runRing, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 37 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:82:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 82 | runRing(tid, nThreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_i8_2, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ _UNROLL>(tid, nThreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:37:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 37 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:82:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 82 | runRing(tid, nThreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_i8_2, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ id < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:4:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 4 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_i8_4, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto10 warnings generated when compiling for host. , unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:37:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 37 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:82:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 82 | runRing(tid, nThreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:4:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 4 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Stium_i8_4, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | d(tid), nthreads(nthreads), tidInBlock(threadIdx.x), tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:37:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 37 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:82:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 82 | runRing(tid, nThreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:4:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 4 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_i8_4, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:37:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 37 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:82:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 82 | runRing(tid, nThreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:4:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 4 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_i8_4, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:37:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 37 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:82:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 82 | runRing(tid, nThreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:4:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 4 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_i8_4, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:37:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 37 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:82:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 82 | runRing(tid, nThreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:4:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 4 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_i8_4, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:37:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 37 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/alltoall_pivot.h:82:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 82 | runRing(tid, nThreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:4:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 4 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_i8_4, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx942. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx908. [ 69%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/broadcast_sum_i8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/broadcast_sum_i8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/broadcast_sum_i8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/broadcast_sum_i8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 17 warnings generated when compiling for gfx1030. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ :77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ const int w = threadIdx.x/WARP_SIZE; \ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_gIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_rgoupr()o; u| ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hp:29:(15: note: )expanded from macro 'barrier_by_group' 29 | c;on st int w = thre| adId ^~~~~~~~~~~~~~~~~~x.x/WARP_S IZE;/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h \ | ^ :29:15: note: expanded from macro 'barrier_by_group' 29 | const int w =In file included from threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | u/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t daintt32_at da1ta,1, f lag1f, data2,l flag2; | a ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] g1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h con:st 29in:t 15w =: thr eanote: dIdx.x/WARexpanded from macro 'barrier_by_group'P_S I ZE; \29 | | ^ const int w = threadIdx.x/WARP_SIZE; \ | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:19:15: warning: unused variable 'bid' [-Wunused-variable] 19 | const int bid = ncclShmnote: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from em.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:19:15: warning: unused variable 'bid' [-Wunused-variable] 19 | const int bid = ncclShmem.channelId - work->channelLo; | In file included from ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:19:15: warning: unused variable 'bid' [-Wunused-variable] 19 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:19:15: warning: unused variable 'bid' [-Wunused-variable] 19 | const int bid = ncclShm/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hem.ch:annelId - work->channelLo; | ^~~ 173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, dataIn file included from 2, /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const intIn file included from w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ wIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:19:15: warning: unused variable 'bid' [-Wunused-variable] 19 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:19:15: warning: unused variable 'bid' [-Wunused-variable] 19 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:19:15: warning: unused variable 'bid' [-Wunused-variable] 19 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:19:15: warning: unused variable 'bid' [-Wunused-variable] 19 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:19:15: warning: unused variable 'bid' [-Wunused-variable] 19 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:19:15: warning: unused variable 'bid' [-Wunused-variable] 19 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:19:15: warning: unused variable 'bid' [-Wunused-variable] 19 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:60:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 60 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:97:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 97 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_i8_2, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:60:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 60 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:97:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 97 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_i8_2, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:60:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 60 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:97:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 97 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_i8_2, nc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:60:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 60 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:97:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 97 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_i8_4, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unrolclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ l>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:60:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 60 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:97:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 97 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_i8_2, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:60:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 60 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:111:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 111 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Broadcast_RING_LL128_Sum_i8_2, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ 611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:60:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 60 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:97:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 97 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:60:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 60 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:97:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 97 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_i8_4, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group( runRinggroup), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_i8_2, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreaIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:60:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 60 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:97:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 97 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_i8_2, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ds(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:60:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 60 | prims(tid, nthreads, &ring->prev, &ring->next, inputBIn file included from uf, outputBuf/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2,: worIn file included from k-/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h>r:ed10: OpIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hArg:,173 0, work->connInd: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(thexr, worek->caondnIInddexx);.x ),| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h :97:g5: note: roin instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested hereu 97p | ( g rrunRoing(tmm.id,b ntuhrefadsf,S wiorkz); es | [ ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hN:432C:78CL_PROTO_SIM: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 60 | prims(tid, nthreadps, A,lgo , P&rotro, iCOLLn_UNgROL-L>(>).rpun(rtide, svub,tn, &worirkn)g; -| ^ >/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cppne:7:1x: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here t 7 | DE,FINE_nccl DeviFunnc(BrpoautBuf, docuastt_pRIuNGt_SBIMuPLfE_,Su wm_oi8r_2k->redOpArg, 0, work->conn, ncclFuncBroadcast, FuncSum, int8_t, NIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:97:5CCL_ALG:O_ RInote: NG,in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here N CC L_P97RO | TO_ SI MPLE, 2) r| ^u /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hnR:611i:62n: note: expanded from macro 'DEFINE_ncclDevFunc' g<611T | , R e RdOpu, PnroWtoor,k BCaOLtLc_hy(,t rid,edop< ntty>,hr ealagdso,, wporortk)o;, u | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < sunbrotlln>()). ruRn(u);n \W | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreadorkCollu()p.(grrun(otupi),d , s| u ^~~~~~~~~~~~~~~~~ b/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.htn, work:)670:;60 : note: field 'group' will be initialized after field 'stepSize'| ^ 670/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp | : 7:1 :ti d(note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested hereti d 7), | nDtEFhIreNaE_dns(cnclthDrevFunc(eBards)o, atiddIcnBalosckt(t_hrReING_SIMPLE_Sum_i8_2, ncadcIdlx.Fx)u, ngrocupB(grrooupa),d c| ^~~~~~~~~~~a st, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:60:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 60 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:97:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 97 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_i8_4, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:60:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 60 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:97:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 97 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_i8_2, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:60:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 60 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:97:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 97 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_i8_4, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 11 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:60:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 60 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:97:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 97 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_i8_2, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:60:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 60 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:111:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 111 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Broadcast_RING_LL128_Sum_i8_2, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:60:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 60 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:97:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 97 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_i8_4, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmIn file included from e/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:10: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:60:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 60 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:97:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 97 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_i8_2, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ m.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/si/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hzeof(T) : :670:s15: warning: tinitializer order does not match the declaration order [-Wreorder-ctor] e670p | S i tidz(teid),_ n) threa{ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group d/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PRs(nthreads), tidInBlock(threadIdx.x), group(group),/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:60: 7: note: | in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~60 | prims(ti| d, tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ nt hrea ds671 | , &rin OTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:60:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 60 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:97:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 97 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_i8_4, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ g stepSize(stepSize_ == 0 ? ->prev, &ring->next, inputBuf, outputBuf, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:97:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 97 | rncunclSRhmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:60:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 60 | priming(reads, &ringti-d, n>threapdsrev, &ring->next,, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | in putB uf, i ofutp utB(tufi, wodrk- < subtn) RunWo>rrkedCOpAorg,l 0,l wo, coTnnIn,de Rx,edO p,w oArlgko,- >cPronoton,Ind eCxO)LL_UNROLL>().; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:97:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 97 | runRing, 1, 2, 4>::run' requested here C12O | DEFINLE_nLcc_lUDNeRvOLL>Fu(tindc, nt(Brhroadcast_RING_SIMPLE_Sum_i8_4, ncclFuncBroadcast, Funeadcs, wSorku); | ^m /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h,:432: 78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | i n t8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | Ru if (ntidW < osubrtn)k RuBnWoarkCotllt(y>,) .run(tid, subtn, walogrok, p)roto;, | ^un r/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cppoll>().ru:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | n(D); E\ F| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hI:670:N15: Enote: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(t_hncclDevFrunce(BraoaddcaIst_RING_SIMPLE_Sum_i8_4, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(thrdx.xead)Idx.x), ,gro up(ggrorup), | o ^~~~~~~~~~~~~~~~~ u/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:p670:60(: group)note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(th, r| ^~~~~~~~~~~~~~~~~ ea/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:d60:I note: field 'group' will be initialized after field 'stepSize' 670dx.x), group(gro | u tid(pti)d), ,nthreads(nthreads), tidInBlock(threadIdx.x), group(gr o| ^~~~~~~~~~~u p), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:60:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 60 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:97:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 97 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_i8_4, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:60:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 60 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:97:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 97 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_i8_4, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:60:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 60 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/broadcast.h:97:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 97 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_i8_4, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx942. [ 69%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/device_table.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/device_table.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/device_table.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/device_table.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/device_table.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/device_table.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/device_table.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/device_table.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/device_table.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/device_table.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/device_table.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/device_table.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/device_table.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/device_table.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/device_table.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 1 warning generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/device_table.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 11 warnings generated when compiling for gfx1030. 1 warning generated when compiling for gfx90a. 11 warnings generated when compiling for gfx1100. 1 warning generated when compiling for gfx1030. 1 warning generated when compiling for gfx1200. 1 warning generated when compiling for gfx1102. 11 warnings generated when compiling for gfx908. 11 warnings generated when compiling for gfx906. 111 warning generated when compiling for gfx942. warnings generated when compiling for gfx1200. 1 warning generated when compiling for gfx906. 1 warning generated when compiling for gfx908. 1 warning generated when compiling for gfx1100. 111 warning generated when compiling for gfx1201. warnings generated when compiling for gfx1201. 11 warnings generated when compiling for gfx1101. 1 warning generated when compiling for gfx1101. 11 warnings generated when compiling for gfx1102. [ 69%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/host_table.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/host_table.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/host_table.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/host_table.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/host_table.cpp 12 warnings generated when compiling for gfx90a. 12 warnings generated when compiling for gfx942. [ 70%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/host_table.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/host_table.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/host_table.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/host_table.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/host_table.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/host_table.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/host_table.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/host_table.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/host_table.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/host_table.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/host_table.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 1 warning generated when compiling for host. 1 warning generated when compiling for gfx1101. 1 warning generated when compiling for gfx1100. 1 warning generated when compiling for gfx906. 1 warning generated when compiling for gfx942. 1 warning generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx1102. 1 warning generated when compiling for gfx1201. 1 warning generated when compiling for gfx1200. 1 warning generated when compiling for gfx1030. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ [ 70%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp.o In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:IZ145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145E; \ | ^ | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | b:173a: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | rrie r barrie_r_by_grboup(); y| ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15:_ note: expanded from macro 'barrier_by_group' 29 | g cornoup(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = stt int w = hthreradIdx.xe/WARP_SIZE; \ | ^ adIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_grIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ oup(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:129: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h::13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: 15/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: :unused variable 'w' [-Wunused-variable] 75 | note: barriexpanded from macro 'barrier_by_group'er_by_ group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: 29expanded from macro 'barrier_by_group' 29 | cons | t int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h14: warning: :unused variable 'data1' [-Wunused-variable] 145 | 145 ui:nt3228_t data:1, fla g1, dawarning: ta2, funused variable 'data2' [-Wunused-variable]lag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h :145:21: 145warning: unused variable 'flag1' [-Wunused-variable] 145 | | u int32_ t data1 , flag 1, datau2, flagi2; n| ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:t145:28: warning: unused variable 'data2' [-Wunused-variable] 3 145 | uint32_t data1, flag1, data2, flag2; 2_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, fl | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.ha:145:35: warning: gunused variable 'flag2' [-Wunused-variable] 145 | 2 uint;32_t d ata1, flag| 1, da ^~~~~ta2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(ti/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZEd), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), ), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, P{ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRYro_to, 0> Fprims U | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cppN:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3C | MSCCL__IMPDL_KERNEEL_ENTVRY_FUNRC_DEVREEDOP_TYDPE(MiOnMaPx_TYPE(MinMax, h, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work)yp;e>, Pr otoL\L128, fullOp s>(com| m, al ^go, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:: 13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:In file included from 173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.hwarning: :initializer order does not match the declaration order [-Wreorder-ctor]13 : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | 670 | ti d(tid) , tid(tid), ntnthreads(nthreads), tidInBlock(threadIdx.x), group(group), hreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROT| O ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | _ stepSizeS(stepSize_I == 0 ? ncMclShmem.cPomm.buffSLizes[NCCEL_PROTO_]SIMPLE]//NCCL_STNEPS/sizeoCf(TCL_STEPS/sizeof(T) :) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNdOp, EFanAsymmLetric<1_,1>, 1,E ProtNo, 0> pTrims | R ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:Y1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here _3 | MSCCLF_IMPLU_KERNEL_NENTRY_FCUNC_DEVR_EDOP_TYDPE(MinMaEx, Vhip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, Func##/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ devre,dop, Prot oSimplPe, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tidL_SLICESTEPS, 2>, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: (tfield 'group' will be initialized after field 'stepSize'id), nthreads (nthr eads), tid670InB | lock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(ntIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ hreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flagIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCIn file included from L_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx942. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx90a. [ 70%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f16.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, fla | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ g1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from [ 70%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f32.cpp.o In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f32.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group'In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:In file included from 28:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp :warning: 1unused variable 'data2' [-Wunused-variable]: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from 145/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h | : 174 : /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h :u75i:n7t:3 2warning: _unused variable 'w' [-Wunused-variable]t data1, f75l | a g 1 , d abtaar2r,i efrl_abgy2_;g r o| u ^~~~~p ()/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h;: 145 :| 35 ^~~~~~~~~~~~~~~~~~: warning: unused variable 'flag2' [-Wunused-variable] /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29: 15145: | note: expanded from macro 'barrier_by_group' uint 3292 | _ t d actoan1s,t filnatg 1w, =d atthar2e,a dfIldaxg.2x;/ W A| R ^~~~~P _SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const iIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ nt w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here , Func##devredop, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.xIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | ), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx942. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx942. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx90a. [ 71%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f64.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp 10 warnings generated when compiling for gfx90a. [ 71%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_groupIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ (); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uinIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.ht32_t data1, flag:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable]In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 75 | barrier_by_group();In file included from | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1 : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h29 | const int w:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29 = threadIdx.x/WARP_SIZE; \ | ^ :15: note: expanded from macro 'barrier_by_group' 29 | const iIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ nt w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | In file included from cons/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cppt:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h :13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: i/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: nunused variable 'data1' [-Wunused-variable] 145 | t uint 32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flagw = threadIdx.xIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrie/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ r_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, Prothreads)o, wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | Yt_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ id(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: In file included from warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3),In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PRO group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1 group(group, Prot o, 0> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.hprims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | :199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | PrimitiveMSCCL_sIMPL_K, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ Asymmetric<1,1>, 1, ProtoC,_DEVR EDOP_T0YPE(MinM>ax, do uble, pfalse);r | ^ ims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ unInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ In file included from | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MIn file included from SCCL_IMPL_KERNEL_ENTRY_FUNC_DEIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ VREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fu/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROllOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tiTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | PrimitivesIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter prims oup (grou| p), | ^ ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3unc##devredop, ProtoLL128, fullOps>(comm, algo, work); \ | ^ :1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ pe, Func##devredop, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ EVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(th/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpprea:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tidIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthred(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROads), TtidInBOlock(th_readIdSx.x),I groupM(group)P, | ^~~~~~~~~~~ LE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h: 29 | co29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ nst int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrIn file included from ier_by_group();/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp | :1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5 ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29::15: note: expanded from macro 'barrier_by_group' 29 | warning: unused variable 'w' [-Wunused-variable] const in80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZt w E= threa;dIdx.x /WARP\_SIZE ; \ | ^ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:unused variable 'data2' [-Wunused-variable]1: 145 | uint3In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_2_tg roup(); | ^~~~~~~~~~~~~~~~~~ data/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h1, flag1, da:ta2, flag292; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h::145:35: warning: 15unused variable 'flag2' [-Wunused-variable] 145 | : note: expanded from macro 'barrier_by_group' 29 | const int w = uint32_t datIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ a1, flag1, data2, flag2; | ^~~~~ threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_gr(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ oup(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tidfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ %WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNELIn file included from _ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, ~~~~~~~~~~~~~~~~~~f | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) ullOps>( c497 | owamm, rpIanBllgo, woock(threadIdx.x/WARP_SIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ IZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flark); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), gThrgead((rtid%4o)==3)u, gropup(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ ( | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 g499 | srtepSizoe(nccup), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hlSh:mem.670comm.:60: note: bufield 'group' will be initialized after field 'stepSize'ffSi 670 | tid(tid), ntzhes[NCCrL_PROeTO_LLa128]/dNCCLs(nthreads), tidInBl_ock(threadSITEPSd/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRun173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:I670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] n 670 | t tid(terpreter, id)P, nthreards(nthreoads), tidInBlock(threadIdtx.x), grouop(group),S | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ i| tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | m stepSipze(stepSlize_ == e0 ? ncclS, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlocSTEkPS/siz(eof(T)t : stephSize_)r { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~e | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.ha:199:d57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here I199 | Prdimitivxes, 1, Prgoto, 0> prims | ^ r/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1o: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested hereu 3 | MpSCCL_I(MPL_KEgRNEroup)L_ENTRY_FUNC_DEVREDOP_TYP, | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ E(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(t]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ id%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, Proitzes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /MSCCL_SLICESTEPS, MSCCL_SLICESTEPS, 2>, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx942. 10 warnings generated when compiling for gfx90a. [ 71%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i32.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp 10 warnings generated when compiling for gfx1030. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ barri er_by_| group( ^); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' In file included from 29 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1 : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13c: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.ho:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:n75:7s: warning: unused variable 'w' [-Wunused-variable]t 75 | i bnarriter_by_In file included from g/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp: r1: In file included from wo/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13 u: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h=p:175: ( /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80)t:5:;h warning: unused variable 'w' [-Wunused-variable] r e80 | | a ^~~~~~~~~~~~~~~~~~badr riI/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.her_dby_x:gro.29up:(x);15 / | : ^~~~~~~~~~~~~~~~~~ W/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h :A29:note: 15R:expanded from macro 'barrier_by_group' note: Pexpanded from macro 'barrier_by_group' 10 warnings generated when compiling for gfx942. _ 29 | S I29conZ | st E i; \ | ^ In file included from const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from nt w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:213: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:_174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:t145:14: warning: dunused variable 'data1' [-Wunused-variable] a145 | t uiant321_t da,ta1, flafg1, ldataa2,g flag2; 1| , ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h: 145:data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, 21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, fdata2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ lag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrierIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | _ by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_, fglag2r; | o ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.hu:145:28p: warning: unused variable 'data2' [-Wunused-variable]( 145 | ) ;uint 32_t dat| a1, ^~~~~~~~~~~~~~~~~~flag 1, d/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hata2, f:lag292; :| ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h15:145::35: warning: unused variable 'flag2' [-Wunused-variable] note: 145 | expanded from macro 'barrier_by_group' u i 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ nt32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | consIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ t int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, expanded from macro 'barrier_by_group'f 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ lag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ int32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdxIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:.x), gro15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ up(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPLIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ _KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ dop, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KEIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ RNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, PIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ roto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple10 warnings generated when compiling for host. , fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx90a. [ 71%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i64.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1030. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group();: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h: 13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_tIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = th data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint3readIdx.x/WARP_SIZE; \ | ^ 2_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from 10In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h75:7: :warning: unused variable 'w' [-Wunused-variable] 75 | barrier_13by_gro: up(); In file included from | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warnings generated ^~~~~~~~~~~~~~~~~~ when compiling for /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:warning: 29:gfx110215:unused variable 'w' [-Wunused-variable] . note: expanded from macro 'barrier_by_group' 29 | 75 coIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ | nst i nt w = t barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' hreadIdx.x/WARP_SIZE; \ | ^ 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:1741: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:: 13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145::14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145:14:145 warning: unused variable 'data1' [-Wunused-variable] | 145 | ui nt32 _t duata1i, flnag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, ftl32_ta datga1, 2flag;1, d ata2 , fl| ag2; ^~~~~ | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | u i uinnt32t_t d3ata12, fl_at data1, flag1, data2, flag2g1,; dat a2, | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.hflag2; | ^~~~~ :145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_gIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ roup();In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75::7: 80warning: unused variable 'w' [-Wunused-variable] :75 | 5 barr:ier_by_ group(warning: ); | ^~~~~~~~~~~~~~~~~~unused variable 'w' [-Wunused-variable] /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29: 15: note: expanded from macro 'barrier_by_group' 29 | 80 | con st bainrrier_by_group();t w = thr eadIdx| .x/WA ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:RP_S29:15: note: IZexpanded from macro 'barrier_by_group'E; \ | ^ 29 | const in t w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 10 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ : /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:2910:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_S warnings generated when compiling for Igfx1201. ZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 72%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpIn file included from InBlock(th/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from r/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from e/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.ha:498:29:d warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] Idx.x/WAR496 | P ti_d(SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ tid), nthreads(n | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3th)reads,), wi d(tidg%WArRP_SIoZE),u warpp((group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCtidL/WARP__SIZE)S, | ~~~~~~~~~~~~~~~~~~T | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)E 497 | P SwarpI/nBlsock(ithreazdIdex.x/WAoRP_SIfZE), ( | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | | warp(tid/WARP_SIZE 498 | P r flaigThmreaid((ttidi%4)v==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stees, 1, P.burffoSiztes[oNCCL,_ PRO0TO_>LL /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:p11: r2In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.hi8:13m]: In file included from s//builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175 N: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h C:498| C:29 ^L: warning: _field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor]/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cppS T496E | :P 3 S :t1/siid(tz:ide ),onote: nfin instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested heret 3 | MSCCL_IMPL_KERNEL_ENT(uiRnt6Y4__t)) { F| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ U | group(groupN /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.hC:199_:57:D note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here E hV199reR | adE s(D ntOPhrPrea_idsTm),Yi wPtid(Eit(vid%MeWAisRPn<_SMTIZa,E ), xRwae,rpd (tiOidnp/Wt,AR6 P_F4SIa_ZEnt),A, s | ~~~~~~~~~~~~~~~~~~yf ma| stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)ml se497 | et )r ;iw | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpretc<1,1>, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested herearpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | er, P r 3o | MStCCLo_LIMPLL_K1ERNE2L_E8NTR,Y_F UNCf_DEuVRElDOPl_TYOPE(fpMlasig>(nMTcahroxeadm,((m tiidn%,4t)= 6=3a)4,l _ggrtoup(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | o, , f wa olrsskete))p;;S i\ z | e ^(| n ^/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h c:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter[N,CC L_PPRrOToO_tLLo12L8]L/N1CC2L_8ST,EP S/fsizueolf(luiOntp64s_t>)) ({ c | o ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ m | m group(group ,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h :a199:l57:go, work); \ | note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimIn file included from ple, fullOps>(comm, a/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:l1: gIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.ho:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidIn, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670B | lo ck (t hr eatdIidxd.x(),t gidro)up,(g ronupt),h reads(nthreads), tidInBlock(threadIdx.x), | g ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~r o | u tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ p671( | g r soteupSpiz)e(,st ep Si| z ^~~~~~~~~~~~~~~~~e_ =/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h= 0 :? 670nc:cl60Sh:m em.note: cofield 'group' will be initialized after field 'stepSize'm m. buff670Si | ze s[ NC CL _PtROiTOd_S(IMtPLiEd), nthreads(nthreads), tid]/INCnCLB_SlTEoPSc/skiz(eotf(hT)r :e satedpSIize_) {d x| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~. x| group(group) /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h,: 199:g57:ro note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Pup(group), | ^~~~~~~~~~~ rimitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlockIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ (threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | conIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_stg int w =r threaodIdx.ux/WARP_pSIZE; \ ( | ^ ); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, fIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ lag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 10 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] In file included from ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepS 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ ize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1030. In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx942. 10 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for host. 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1101. [ 72%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u32.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | In file included from barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp const int w = threadIdx.:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZx/WARPE_SIZE; \; | ^ In file included from \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | In file included from barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | con ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.hs:145:28: warning: tunused variable 'data2' [-Wunused-variable] 145 | uint3int w = threadId2_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ x.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h :174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h: 75:7: warning: unused variable 'w' [-Wunused-variable] 75c | obarrienr_by_sgroup(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from t int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, fIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE;lag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t dIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ ata1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), gro | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ up(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ RunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] reads(nthr 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threeads), tidInBlock(threaadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, faldIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ se); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERtNype>, ProtoLL128, fullOps>(comm, algo, work); \ | ^ EL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fuIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinllOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threMaax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthredIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx942. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx90a. [ 72%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u64.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx942. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx90a. [ 72%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ TEPS, 2>, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 10 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx942. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx90a. [ 73%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_bf16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ antissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, :14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 10 warnings generated when compiling for 10 warnings generated when compiling for gfx908. gfx1201. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 10 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 10 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cppw:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13 : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h=:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | t barrhier_by_rgroup();e | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.ha:29:15: note: expanded from macro 'barrier_by_group'd 29 | I codx.x/WARP_SIZE; \ | ^ nst int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t dIn file included from a/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: ta1, /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hflag1,: dat75a2,: fl7ag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35:: warning: unused variable 'flag2' [-Wunused-variable] 145warning: unused variable 'w' [-Wunused-variable] 75 | barrier_b | y uint_32_t dgata1, frlag1,oup(); | data2 ^~~~~~~~~~~~~~~~~~, fl /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15:a g2; | ^~~~~note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 10 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint3In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h2_t data1, flag1:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ , data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: In file included from unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from ^~~~~/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uin:75:7t: warning: unused variable 'w' [-Wunused-variable] 3 75 | 2 b_arrietr_b datIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ a1,y _groupf(); lag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h: | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | consIn file included from t/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ int w = threadIdx.x/WA145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ RP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx942. 10 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3id%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShm 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ em.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo,In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:In file included from 1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SI/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1Z: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13E: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: )/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29:, warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | w arp(tid/WARP_SIZE), tid( tid),| nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | wawrpInBlaock(trhreadpIdx.xI/WARPn_SIZEB), | l ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE o 498 | c flagThread((tk(thried%4)=adIdx=3.), gx/WARP_roupS(grouIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flp),a | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~g | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 T 499 | h sterpSizeead((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepS(nccilShmezm.comem.buffSizes[NCCL_PROTO_LL128]/NCCL_STEP(ncclShmem.comm.buffSizes[NCCL_PROTS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ O_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ T, RedOp, FanAsymmetric<1,1>, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp::1498: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h::13: 29In file included from :/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:warning: 498:29field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor]: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | 496tid | (ti d), nt hrea ds(tnthireadds), wid(t(id%tWARiP_SdIZE), nthreads(nthreads), wid(tid%WARP_SIZE), )w, awarrp(tipd/W(ARPt_SIiZE)d, /| ~~~~~~~~~~~~~~~~~~ W | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) A 497 | R P _warSpInBIlocZk(tEhre)ad,Idx .x/ WAR| P ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | wa_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThrrpInBlock(threadIdx.x/WARP_SIZE),e ad( (ti| d ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~%4) ==3 | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclSh),m groeup(mgro.up),c | o ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ m| warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3m . 499b | u stfepfSizeS(nciclSzhmeem.csomm[.bNuffSCizeCs[NLCCL__PRPOTRO_LOL12T8]/NOCCL__STLEPS/Lsiz1eo2f(u8int]64_/t))N { C | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ C | group(groupL /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57_: note: Sin instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here T199 | EPS/s Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives,A 1,s Pryotom, 0m> perimst | r ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cppi:3c:1:< note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here1 ,31>, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_ | MSFCCLU_IMNPL_CKERN_EL_DENTERYV_RFUNCE_DEDVREODOPP_TY_PE(TProYd, hPip_Ebfl(oatP16,r faolsed); , | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:h384:3i: note: pexpanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter_b>, ,Pro toLPL12r8, ofutllOops>L(coLmm,1 al2go,8 wo,rk) ; \f | u ^ llOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(gIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdxr.ox),up), | ^~~~~~~~~~~ group(gIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] roup), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_ stepSize(stepSize_ == 0 ? ncclShmem.comm.bIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ uffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_)I MPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for host. [ 73%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_bf8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadI/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cppd:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: xIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] . 75 | x bar/rier_by_gWroup()A; | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hR:29:15: note: Pexpanded from macro 'barrier_by_group' 29_ | cSIZE; \o ns | ^t int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizeIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthrIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, aeads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) s{ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here lgo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(cIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ omm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthre 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunadsInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_10TYPE(Prod, warnings generated when compiling for host. rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ _SLICESTEPS, 2>, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx942. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx90a. [ 73%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f16.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx942. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, hIn file included from ead, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZ/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hE; \: | ^ 29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h::145:21: warning: unused variable 'flag1' [-Wunused-variable] 13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_tIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp::7:1: warning: In file included from unused variable 'w' [-Wunused-variable]/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:: 113: : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group()75; | | b ^~~~~~~~~~~~~~~~~~arr ie/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hr_by_gr:ou29p():; | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h15:29:15:: note: expanded from macro 'barrier_by_group'note: expanded from macro 'barrier_by_group' 29 | 29 c | onsIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.ht:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:i174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:n145:14t: warning: unused variable 'data1' [-Wunused-variable] w145 | =uin t32t_t hdatra1, eflaag1, ddatIa2,d fxlag.2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32 _ tconst in t w = threadIdx.x/WARP_SIZx/EWAR;P_S IZE\; \ | ^ | ^d atIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ a1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uIn file included from int32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uin/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cppt3:2_1t : daIn file included from ta/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h1,: f13la: gIn file included from 1,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h d:at174a2: , /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.hfla:g2; 145| :14: ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 145 | uint32_t daIn file included from t/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32a1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28:_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const iIn file included from nt w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128,In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: fullOps>(comm, algo, work); \ | ^ note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSiIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.bufzes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) {fSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199Func##devredop, ProtoLL128, fullOps>(comm, algo, work); \ | ^ | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), widIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ (tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_S stepSize(ncclShmem.comm.buffSiIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ zes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' In file included from 387 | mscclRunInterpreter/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:I, nProtBolSimple, , f u| ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~l | l tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ O 671 | ps > ( scotmempSi, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15:ze (snote: tfield 'nthreads' will be initialized after field 'tidInBlock'ep Si ze_ =670 | = 0 ? ncclShmem.comm.buffSizes[ N tiCd(CtLi_d)P, RntOhTO_SIMPLE]/NCCL_STreEadPsS(/ntshizreeaodfs)(, Tti)dI nB:lo cks(tthreeapdISdxize_.x)), g{r ou| p ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~( gr| ou group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57:p), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tnote: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested herei d199( | t Pirdim)it,iv esnu, p1,( Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPLgr_ouKp)E, | R ^~~~~~~~~~~ NEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitigfx90a. ves, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 73%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f32.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp 10 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: :In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:75173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7:: warning: unused variable 'w' [-Wunused-variable] 7 75 | : warning: unused variable 'w' [-Wunused-variable] /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1 barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group'75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threa: In file included from d/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7d: warning: unused variable 'w' [-Wunused-variable] x 75 | .barrier_xby_grou/p(); In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ | W 29 | ^~~~~~~~~~~~~~~~~~ Aconst R i/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hnt w =P threa_:dISdx.x/WARIP_SIZEZ; \ E29| ^ ;: 15:\ | ^note: expanded from macro 'barrier_by_group' 29 | consIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:t int 75w = t:hre7adIdx.:x/WA RP_Swarning: IZE; \unused variable 'w' [-Wunused-variable] | ^ 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:_174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:g7: warning: unused variable 'w' [-Wunused-variable] r75 | barori/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: ueIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: prIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h_:75:7: (bwarning: unused variable 'w' [-Wunused-variable] 75)y | ; b a _rrige| r ^~~~~~~~~~~~~~~~~~r_b o/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hy_g:29upro:(15)up:;( note: expanded from macro 'barrier_by_group' 29 | co n s| t ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29 :15:); i | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hnnote: texpanded from macro 'barrier_by_group': 29:15: w note: expanded from macro 'barrier_by_group' = t29 | const int w29 | con=st i nt w t=h rtheIn file included from ardea/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cppI:d1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.hd:I13: xdIn file included from x./builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:x.174/x: W//builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.hWARP_SIZE; \ | ^ ARP_SIZE; \ | ^ In file included from :75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: hrenote: adIdx.expanded from macro 'barrier_by_group'x/WA RP_ SIZE; \ | ^ 29 | const int wIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint3 = 2threadI_dx.x/WtARP_S IZE; \d | ^ ata1, flag1, data2, fIn file included from lag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp::1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h: 13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174warning: : /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14unused variable 'flag1' [-Wunused-variable]: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_145t data | 1, fla g1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: 1, In file included from flag1,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h data2, flag ui2nt32_t data1, flag1, data; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 2, flag2; | 145 | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, :174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:f145:14l: awarning: unused variable 'data1' [-Wunused-variable]g2 145 | ;uint 32_ t da| ta1, ^~~~~ fla g1/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h, data2, f:lag2145; | : ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h35 ::uin 145t:32_t21 dwarning: a:unused variable 'flag2' [-Wunused-variable]ta1, flag 1, dwarning: atunused variable 'flag1' [-Wunused-variable]a2, 145 fla | g2 ; 145 | ^~~~~ | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h :145u :35:i nuwarning: unused variable 'flag2' [-Wunused-variable] i145t | n 3t ui3nt3222___tt td d daaattta1a1,,a 1, ffllaagf1lag1,,g1 da, dta da2a,ta2t , a2fl,afgl2ag2; ; | ^~~~~ | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h ^~~~~ :145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_ flag2; | ^~~~~ t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] In file included from 80 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp :1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h :13: In file included from b/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: a/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: rwarning: unused variable 'w' [-Wunused-variable] r 80 | i e barrrie_r_byb_y_grogrupo(); u | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hp(:)29:;15: note: expanded from macro 'barrier_by_group' | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: 29 | note: conexpanded from macro 'barrier_by_group's t 29i | consnt w = threadIdx.x/WARP_SIZE; \ | ^t int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ ); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175In file included from : /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flaIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ g1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 10 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float,In file included from false); In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthr | e^/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.ha:384::3:d 1note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' s384: | ms(ccIn file included from lnthreads), wid/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:(13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:t175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498i:d29%:RuWARP_SIZE), wa warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] r496 | p tid(tid/(tiWd), AnthrnInRteerprePtaer_, hProtoLrL128, fullOps>(comm, algo, work); \ | ^ SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThreaedads)(, wid(tid%WARP_(SIZE), warp(ttid/WARiP_SIZE)d, | ~~~~~~~~~~~~~~~~~~ % | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 4497 | w)arpIn=Block(=threa3dIdx.x/)WARP_,SIZE), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSiz | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499es[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here< 1, 1>, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3:199 | Primi1tives<:T, Red Op, Fnote: anAsyin instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested heremmetr ic<1,1 3 | MSCC>, 1, ProL_IMPL_KERNEL_ENTRY_FUNCIn file included from _DEVREDOP_TYPE/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (to, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ >, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), grou496p | ( tid(tgid)r, nthroeads(ntuhreads),p wid(ti)d%WARP,_SIZE), warp(tid/WARP_SIZE) , | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) | 497 | w ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~arpInBl ock(t hreadId| x tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_. x /671 | stepSize(stepSize_ == 0WARP_S IZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives64_t)), { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | 1, Proto, 0> prim group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primis | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpretern, 1,c Prot#o, 0># primds | ^e /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cppv:3:1: rnote: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here e 3 | MSdCCL_IoMPL_KpERNEL<_ENTRtY_FUNyC_pDEVREeDOP_TY>PE(Pr,od, f loat,P falsre); o | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.ht:384:3:o note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' S384imple< | mscclRunInterpreter, fullOps>(comm, algo, wotrypke, Fu)nc##de;vredo p, P ro toL| L128, ^ full Ops>(c/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.homm, algo, wo:rk); \ | ^ 670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), 10 warnings generated when compiling for gfx906. tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor]In file included from 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x),/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | P r tidi(tid), nthreads(nmthreiads),t tidIniBlock(vthreeadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_s, 1, Preof(T) : steopSizteo_,) 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVRE{ | D ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~O | group(group P/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:_199T:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested hereY 199 | P PrimEitiv(es, f1, lProotaot, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' , 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMP387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm,p, ProtoSimple, ftulliOps>d(coImnBm,lo acklg(othreadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h, work:); \670 | ^: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h60:670:15:: note: field 'nthreads' will be initialized after field 'tidInBlock' note: 670 | field 'group' will be initialized after field 'stepSize' t id( tid),670 n | t h tid(tid), nthreareads(nthreads), tidInBlds(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE),10 warnings generated when compiling for gfx1200. warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterIn file included from p/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ reter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(grou/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \dOp, FanAsymmetric<1,1>, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1030. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(nIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ cclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 10 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ : /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for host. 10 warnings generated when compiling for gfx90a. [ 74%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f64.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | t y, head, mantissa; | ^ uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group()); | ^~~~~~~~~~~~~~~~~~; /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15 : note: expanded from macro 'barrier_by_group' 29 | | const i ^~~~~~~~~~~~~~~~~~n /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group't w = threadIdx.x/WAR P_29S | const inIZE;t \ | ^ w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 10 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrIn file included from iIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ er_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: :In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:,1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h fl:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.ha:174: g/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:214: warning: ;unused variable 'data1' [-Wunused-variable] 145 | | uin ^~~~~t32_ t d/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:at21a1:, warning: funused variable 'flag1' [-Wunused-variable]l a g1145, | d a ta2u, inflt32_t data1, flag1, daag2; t | ^~~~~ a/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:2145:21:, warning: unused variable 'flag1' [-Wunused-variable] f145 | l uag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | intu32_ti datna1, tflag312, _datta2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t d data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1,ata 1, fflalg1,a dagta21, f,lag2 ; d| ^~~~~ a/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:t145:35a: warning: unused variable 'flag2' [-Wunused-variable]2 , f l145 | a g 2 u;i nt3| ^~~~~2_ t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp::1: note: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:expanded from macro 'barrier_by_group'13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175 29 | const int w = threadIdx.x/WARP_S: I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:Z5: Ewarning: unused variable 'w' [-Wunused-variable] ; 80 | \bar rie r_b| y_g ^rou p(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 10 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 10 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_grIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ oup(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZEIn file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ ; \ | ^In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 10 warnings generated when compiling for gfx942. [ 74%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid//builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.hW:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:A175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:R498:29: warning: Pfield 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] _ 496 | tid(tiSd), nthIreaZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | ds(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | wa stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)rpInBlock(threadIdx.x/WARP_ SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | 497 f | l a warpIngThread((tid%4)==3), Bgroup(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ lock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ?In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor]ple, fullO | p tid(s>(tcomm, id), ntalgoh, woreads(nthreads), tidInBlock(threadIdx.x), grrk); o\ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock'u 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ p(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0>/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%W prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter,ARP_ SIZE),P warp(tird/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~o | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) t497 | owarpISnBlocki(threadImdx.x/WApRP_SIZlE), | e ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | , fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tmeim.comm.buffdSizes[INCCL_PROTO_LL128n]/NCCLB_STEPSl/sizoeocf(uintk64_t))( t{ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~h | group(group r/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199eadIdx.x), grou:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0>p(gr oup)p, | ^~~~~~~~~~~~~~~~~r /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hi:670:60: mnote: field 'group' will be initialized after field 'stepSize' 670 | s tid (tid), nt| hrea ^ds /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp(nthrea:3ds:), tidInBlock(threadIdx.x), group(group), 1: | note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here ^~~~~~~~~~~3 | MSC CL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(thrIn file included from ead/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:d173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15:x warning: initializer order does not match the declaration order [-Wreorder-ctor] .670 | x tid(ti/d), nthWreadsA(nthreRads), tPid_ISnIZE), | Block(th ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~re a | warp(tid/WARP_SIZE 498 | flagThrdeIdx.xa), group(grodu(p()t,id%4)= | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ ===3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof 0 (? ncclSuhmem.coinmmt.bu6ffS4izes[_NCCL_PRtOTO)_SIMPLE])/NCCL_STEPS/size of{ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: (note: T) : sin instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested heretepSize _) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group 199 | Primitives/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:<57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here T ,199 | R Perdimitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.hic<1,1>, 1, :Pr384oto:, 0>3 pri:ms | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cppnote: :3:1expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE': note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSC CL_IMPL_KE384RNE | L_ENTR Y_FUN C_DEmVREDOsP_TYPcE(cProd,l doublRe, funInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ Func##devredop, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_groIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:up(75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ ); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group() uint32_t data1, flag1, data2, flag2; | ^~~~~ ; | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, da:15: note: expanded from macro 'barrier_by_group't 29 | a2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h: cons145t in:t w = t28hreadId:x.x/WAR P_SIZwarning: E; \ | unused variable 'data2' [-Wunused-variable] ^ In file included from 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = thrIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ eadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ P_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WAIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ RP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tidWAR)P_SIZE),, | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | n flagtThread((htid%4)==r3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ eads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), ntIn file included from hreads(nth/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cppr:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13e: In file included from ads), tidInBlock(t/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hh:173r: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:e15: warning: initializer order does not match the declaration order [-Wreorder-ctor] a 670d | Itid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(grodx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(groupup),) | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ , | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | s tepSi| ze(st ^~~~~~~~~~~epSiz e_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthIn file included from reads(nthreads), tidInBlock(threadIdx.x), group(gro/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cppup):, 1 | : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h ^~~~~~~~~~~~~~~~~ :/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60175: note: : field 'group' will be initialized after field 'stepSize'/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h : 498670:29 | : warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads),tid( tid),w nthreads(nthireadsd), ti(dInBltock(tihreaddIdx.x%), group(group), | ^~~~~~~~~~~ WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ RedOp, FanAsymmetric<1,1>, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERIn file included from NE/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: LIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: 10 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: _/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor]E NTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_S)IZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadId; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ x.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670 | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~: | group(group60 /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h::199:57 : note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here note: 199 | Pfield 'group' will be initialized after field 'stepSize'rimi tives ,tid(t 1, Pirdo)t,o ,nthrea d0> prsim(snthreads), tidInBlock(threadIdx.x), grou | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cppp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_fl(group), | ^~~~~~~~~~~ oat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadId/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ x.x) , group| (group) stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h :670:60 : note: field 'group' will be initialized after field 'stepSize' 670 | 497 tid(ti | d), nth read s(nthre ads), tidInwBlock(tahrrepaInBlock(threadIdx.xd/Idx.x),W group(Agroup),R P_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE | ^~~~~~~~~~~ 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx942. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx90a. [ 74%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i32.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w =In file included from In file included from threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | ui/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ nt32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1,In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | In file included from barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = t data2, flag2; | ^~~~~ hreadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_groupIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ (); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, fIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmemalse); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ .comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthres[NCCL_PROTO_SIMPLE]/NCCL_STEeads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ PS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, :full29Ops>(:comm, algowarning: , wofield 'group' will be initialized after field 'stepSize' [-Wreorder-ctor]r k); \ | ^496 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670 :15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid)ti,d(tid ), nntthreadhs(ntrehradseads(n)t, hwridea(tdis), tidInBlock(threadIdx.x), group(In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^~~~~~~~~~~ ), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tiIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13d): , nthreaIn file included from ds(nthr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.heads):, wid175(tid: %WARP/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h_SIZE),: warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto498:29: warning: , 0> field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor]prim s | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp: 3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL496_I | MP L _K EtRiNd(tid), nthreads(nthreads), wid(EL_tENTRY_FiUNC_DdEVREDO%P_TYPE(Prod, int32W_AtRP_, falSIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZEse); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h: 384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | 498 mscclR | unInte rpretera, ProtogLL128,T fulhlOps>(rcomm, algo, woerakd)(;( tid%4)==3), group(group), \| | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ ^ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_to LL128 , fullOps>671(com | m, al go , wor k); \s | ^ tepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ unInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, fIn file included from als/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: eIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from )/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h;:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | | ^tid(ti d), /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.hnthreads(:nthre387ads),: tidI3nBl:o cknote: (expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpthreadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(sreter, ProtoSimple, fullOps>(commtepSize_, == 0 ? ncclShmem.caomm.bluffSgizes[oNCCL_P,ROTO_SIMPLE ]/NwCCL_SoTEPS/rsizeofk(T)) ;: st e\pSiz e _)| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Pr670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_S:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(ntimihtivesr, 1 , Protto, 0>i primds I | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cppn:3:1B: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here l 3 | MSoCCL_IMcPL_kKERNE(L_tENTRYh_FUNCIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), _rDEVReEDOP_TaYdIdx.x), group(gPE(Prod, int32_t, false);group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | roup), | ^~~~~~~~~~~ mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), 10group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ warnings generated when compiling for gfx1102. 1010 warnings generated when compiling for gfx1100. warnings generated when compiling for gfx908. 10 warnings generated when compiling for host. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx942. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx90a. [ 74%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i64.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx942. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx90a. [ 75%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa;In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ : warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrieIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ r_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_gr: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | conoup(); s | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:t29:15: note: expanded from macro 'barrier_by_group' 29 | i consnt itn w = threadIdx.x/t w W= threadIAdx.x/WARRP_SIP_SIZZEE; ;\ \ | ^ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ adIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:75173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7 | : warning: unused variable 'w' [-Wunused-variable] 75 | barr ier_by _group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h :29:15 : bnote: aexpanded from macro 'barrier_by_group'rrier_by 29 | _ cogronst int up(); w = thr| e ^~~~~~~~~~~~~~~~~~a d/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29Id:x.x/15In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ W: note: expanded from macro 'barrier_by_group' 29 | ARP_cSIZE;o \n s| t ^ int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZEIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARPIn file included from _SIZE)/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h,:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h :498:29:w warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] a 496 | r tidp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadId(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlocx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[k(threadIdx.x/NWARPC_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flCagThreaLd((ti_d%4)==3), gProup(gRrouOp),T O _LL128]/NC| ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~C | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | sLte_STEPS/sizeopSize(nfcclShm(em.ucint64_t))omm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/siz { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here eo3f( | uintM64_tS)) C{C | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ L | _ group(group IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TY/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199P:57: Enote: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here ( 199 | P Prrimitoives, 1,4 Proto_, 0>t prim,s | ^ f/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cppal:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUse); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullNC_ODEVpREDOPs_TYP>E(Prod(, intc64_t,o falmse); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.hm:384:3, : note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' a 384 | lgo, work); \ | ^ mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor]:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x),In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | gr oup(grou p), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671t | stepid(tid), nthreads(nthrSize(stepSize_ == 0 ? ncclShmem.ceomm.buffaSizes[NdCCL_PROsTO_S)IMPLE]/N,CCL_STE PS/sizetof(T) :i stepSizde_) {I | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | n group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.hB:199:l57ock(: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, ?Proto, 0 > prinms c c| l ^ S/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpphmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/N:C3:1: note: Cin instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3L | MSCCL__IMPLS_KERNTEL_ENETRY_FPUNC_DESVR/EsDOiPze_ToYfP(TE()P :rod ,s tienptS64_ize_t), fal se{) | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | ; group(group| ^/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | msccl199 | Primitivesreter, prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FU,C Pro_toSimDple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), groe);up( g r| ou^p )/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h, :387 | : ^~~~~~~~~~~~~~~~~3 :/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h :note: 670expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE': 60 : note: 387field 'group' will be initialized after field 'stepSize' | ms670c | tcild(tid), nthreaRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cppIn file included from :1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h::175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:175498:29: : warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.htid(:tid), nthreads(nthreads), 498wid(:t29i:d %warning: Wfield 'group' will be initialized after field 'stepSize' [-Wreorder-ctor]A R P_S496 | tid(tid), nIZEt), warhp(tird/WeARP_aSIZE)ds(nthreads), wid, | ( ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) t 497 | i wda%rWARpIPn_SIZE), warp(tid/WARP_SIZE)Bloc,k(th read Idx.x| /WARP ~~~~~~~~~~~~~~~~~~_SIZE ), | | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE497 | 498 | flawarpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, In file included from Pro/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cppt:o1,: In file included from 0/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h>: 13p: rIn file included from i/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hm:s173 : | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h ^: 670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3670 | | M S C C Lt_iIdM(PtLi_dK)E,R NnEtLh_rEeNaTdRsY(_nFtUhNrCe_aDdEsV)R,E DtOiPd_ITnYBPlEo(cPkr(otdh,r eiandtI6d4x_.tx,) ,f aglrsoeu)p;( g r| o^u p), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h| : tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_384 :3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 671 | 384s | t e pmSsiczcel(RsutneIpnStiezrep_r e=t=e r0< t?y pnec,c lFSuhnmce#m#.dceovmrme.dboupfs,[ NPCrCoLt_oPLRLO1T2O8_,S IfMuPlLlEO]p/sN>C(CcLo_mSmT,E PaSl/gsoi,z ewoofr(kT)); :\ s t| e ^p Size_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ gThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor]In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads ( 670 | tinthd(tidr), nthereaads(nthrdeadss), tid)InB,lock(thre adtIdx.xidInBloc), group(kg(rtohreadup), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSiPzS/siezeof(_T) :) step Size_{) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h: 199:57: | note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~199 | P rimi tiv| es group(group< T/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h, R:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199edOp, FanAsymmetric<1,1>, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYP | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, E(fProda, inlt64_ts, falese); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h):387:3;: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | | mscclR^unIn /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.hterpreter, ProtoSimple,1IC: EIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h S:PrT13E: otPIn file included from o/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hS, MSCCL_SLICESTEPS, 2>, fullOp:173s: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:>15: warning: initializer order does not match the declaration order [-Wreorder-ctor]( 670 | c tiod(tidm), nthreSimpadleo,c kf(utlhlOrpeadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~s>(co mm, algo, work); \ | ^ | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:m tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_, a lgo,670 work) :;15 \ | : ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h :670:15:671note: note: field 'nthreads' will be initialized after field 'tidInBlock' field 'nthreads' will be initialized after field 'tidInBlock'670 | t id(tid), nt670hread | s(nth read s), t idInBl ock(tthireadIdx.x), group(gr | o steupSizep(step)Size_, == 0 ? nccl| Sh ^~~~~~~~~~~~~~~~~m e/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hm.:c670o:m60m:.b ud(note: tfid)field 'group' will be initialized after field 'stepSize',f nt Shirea zdse(nths670 | tid(tid), n[NCCLt_PROThO_SIMrPLE]/ereNadsa)C, dCtidIsnLBl(o_cnk(thrteadIdhSx.xr)T, gerEouaPp(gdrSoups)/, ) | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h, stiz:670ie:dIof60:n( Block(tT) : stepSize_) note: field 'group' will be initialized after field 'stepSize' {670 | tid( tid),| nthr ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ehare a | group(group ds(nthread/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.hs:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here ), tidInBl199ock( | t h rdPeIardidx.xIm), gdixtroup.i(groxvup), e) | s, ^~~~~~~~~~~< T, RedOp, Fagronup(Agroup)s, | ^~~~~~~~~~~ym metric<1,1>, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | coIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ nst int w = thrIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ eadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:1375:7: warning: unused variable 'w' [-Wunused-variable] : 75 | In file included from bar/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hrier_by:_group();173 | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ : /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_grouIn file included from p(); /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1 : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: In file included from note: expanded from macro 'barrier_by_group' 29 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1 : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13 : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.hconst:75: 7int : warning: unused variable 'w' [-Wunused-variable]w = th r75 | eadIdx.x/WAR barriPe_SIZE; \ | ^ r_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const iIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:unused variable 'w' [-Wunused-variable] 13 75 | : In file included from barrier/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h_by_gro:up(); 174| ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29: :15: note: expanded from macro 'barrier_by_group' /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h29 | : con145st int :w = thr14eadIdx.:x/WARP_ SIZE;nwarning: t wunused variable 'data1' [-Wunused-variable] = t\ hreadI d x.x/WARP| _SI ^ZE; \ | ^ 145 | uint32_t data1, flag1In file included from , data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:145:28: warning: unused variable 'data2' [-Wunused-variable] 1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h145:145:14: | warning: unused variable 'data1' [-Wunused-variable] 145 | u int32_ t data1 , flag1, data2, flag2;u | ^~~~~ i/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145n:21: warning: unused variable 'flag1' [-Wunused-variable] t 145 | 3 2u_itn tIn file included from data1, flag1, da3t2_at data12, ,flag1, data2, fflag2;lag2; | | ^~~~~ ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cppu:1: In file included from i/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from n/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:t145:14: warning: unused variable 'data1' [-Wunused-variable]3 1452 | _ t udiantt32_t d/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ ata1,a1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :145:28: warning: unused variable 'data2' [-Wunused-variable]In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, aIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpplgo:, work)1; \ : | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670In file included from :15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInB/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1l: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: oIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670c:15: warning: initializer order does not match the declaration order [-Wreorder-ctor]k 670 | ( tid(ttid), nhthreadrs(nthreeads)a, dIdtxid.Inx), groBlocku(pth(greradoIup), | ^~~~~~~~~~~ dx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128] flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERN/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ EL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tIn file included from id), nthreads(nthrea/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1ds),: tidInBIn file included from loc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.hk:(13t: hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:readIdx.x), group(group)175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 496 | tid(tid), nthreads(nthreads), wid(tid%WARP, _ | ^~~~~~~~~~~ SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498199 | Primiti:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ ves, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ threadIdx.x), group(group), | ^~~~~~~~~~~In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunIIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), war note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' p 387( | mscctlRunIntierpreter, | ProtoSim ple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:k670(threa:dIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSize15: note: field 'nthreads' will be initialized after field 'tidInBlock's [670 | tNid(tidC),C nthreLads(_nthPreRads), tOidInBlTock(thOrea_LL128]/NCCdIdx.Lx), g_rSoup(gTrEoPupS)/,si ze | of ^~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hu:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthint64r_t))e { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~a | group(group d/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.hs:199:57(: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here n199 | tPrimihtives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNELk_(thrEeadIdxN.x),TR groYup(gr_FUoup),N | ^~~~~~~~~~~ C_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx942. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx90a. [ 75%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u32.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx942. 10 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx1030. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = th | r coensta int w = thdreadIIdx.xd/xW.ARP_xSIZE/;W \ A R| P ^_ SIZIn file included from E; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:ui174nt3: 2_t/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h da:ta175,: fl7ag:1, d atawarning: 2unused variable 'w' [-Wunused-variable], fl ag2; 75| ^~~~~ | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h: 145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uin t32_ tb adatra1,r ifleag1r, d_atba2, yfla_gg2r; o| ^~~~~ u/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.hp(:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, da)t; a | 2 ^~~~~~~~~~~~~~~~~~ ,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h: 29:f15:l note: expanded from macro 'barrier_by_group' a29g | 2 ; c on st| i ^~~~~nt w/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h = thr:eadIdx.x/WARP_S145:IZ35: warning: E;unused variable 'flag2' [-Wunused-variable] \145 | | ^ uintIn file included from 32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ ag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flagIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 10 warnings generated when compiling for gfx90a. [ 75%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u64.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cppIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter| o,c kP(rtohtroeLaLd1I2d8x,. xf/uWlAlROPp_sS>I(ZcEo)m,m , | a ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~l g o| , warp(tid/WARP_SIZE work); 498\ | | ^ flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid),3 | MSCCL_IMPL_KERNEL_ nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == ENTRY_FUNC_0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group DEVREDOP_TYP/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group();1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = thre:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173a: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | con st int w = threadIdx.x/WARP_SIZE; \ | ^ barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ dIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group();/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uin ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:t29:15: 32_note: expanded from macro 'barrier_by_group' t 29 | const in t w = dthreadIdx.x/WARP_SIZE; \ | ^ ataIn file included from 1, flag1,In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] d ata2, fla75g2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h: | 145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | u int32_t daIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t bata1, flrragi1er_by_, gdata2rIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] oup, fl(); ag2; | | ^~~~~~~~~~~~~~~~~~ ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:: data1, flag1, data2, flag2; | ^~~~~ 145:3529: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp::1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h15warning: :13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hunused variable 'flag2' [-Wunused-variable]: note: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] expanded from macro 'barrier_by_group' 145 | 29 | :174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.hu:145:14: warning: unused variable 'data1' [-Wunused-variable]i 145 | uinn145 | uint32_t data1, flag1t32, data2, flag2; _tt | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_tdata1, flag data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uin13,2_t d daata2ta1,, flagflt32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, daag2; co nsta2, flag2; | ^~~~~ 145 | t| uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ i ^~~~~nt w = thr eadId/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.hx.x:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t da/WARP_SIZE; \ | ^ 1, data2, flag2; | ^~~~~ ta1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uiIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from nt32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, daIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] ta2, fla 145 | uint32_t data1, flag1, dag2; ta2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | u | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145int32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32:28: warning: unused variable 'data2' [-Wunused-variable] 145 | _t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t uint32 data1, flag1, data2, flag2; | ^~~~~ _t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIn file included from ^ Idx.x/WARP_SIZE; \/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp: | 1 ^: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int wIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:In file included from 199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from :3:1/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: :field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tidnote: ), ntin instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MhreaSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ ds(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13KER: NEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tiIn file included from d%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreadIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tTYPE(Prod, uint64_t, fid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInalse); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterprBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%e4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3ter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ s(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ tid(tid), nthread s(nthreads), tidInB671 | lo ck(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSizstepeSize(stepSize_ == (0 ? nccslShmem.tcomm.buffSizeespSize_ == 0 ? ncclS[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | hmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 10 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]10/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for host. 10 warnings generated when compiling for gfx942. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx90a. [ 75%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | cons/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1t in: t w =In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7 th:readIdx.x /WARPwarning: unused variable 'w' [-Wunused-variable] 75_SIZE | ; \ barr | ^ ier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = In file included from threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barriby_geroup(); r | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:_29:15: note: expanded from macro 'barrier_by_group' b29 | coynst int _w = thregadIdx.x/rWARP_SIZoE; \ | ^ In file included from up(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:_1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from t/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145: dat14: warning: unused variable 'data1' [-Wunused-variable]a 145 | 1 uint,32_t dat a1, flag1f, data2,l ag1,flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | data 2, flag 2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145: 35: warning: unused variable 'flag2' [-Wunused-variable] u 145 | i uint32n_t datta1, fl3ag1, d2ata2, _flag2;t | ^~~~~ data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.xIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flagIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | 2; | ^~~~~ barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdxIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ .x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ : warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 10 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ x.x/WARP_SIZE; \ | ^ 10 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 75%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_bf16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizeIn file included from s[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(grouIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ p), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) :LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | P stepSirze_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ imitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> pri/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.hm:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] s496 | | ^In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ tid3(tid), | nthreadsM(nSCCL_IMPthrLeads),_ wid(tid%WARP_SIZE), warp(tKERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreteid/WARP_rSIZE),< | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)t 497 | yp wearpInBl,ock(thre adIdx.xF/WARP_SIuZE), | n ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498c | fla#gT#devredop(tid%4,)== ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthrea_dLL128s]/NCCL(_STnEPS/sitzeof(huint64r_t)) e{ | a ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group d/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:s199:57: )note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199, | Pr imittiidves , 1, Protto, 0i> prdims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KER(Ntid)E, ntLhrea_ds(nEtNTRY_FUNhreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ C_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ EL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthread10s(nthreads), tid warning/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13InBlock(threadIds generated when compiling for host: . xIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid).x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid),, nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(ste nthrpeads(nthrSeads), tidiInBlockz(threadeIdx.x), gr_oup(group) , | ^~~~~~~~~~~ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), grouIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ p(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const intIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t dataIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 1, flag1, data2, fla 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ g2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ uint32_t data1In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ , flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | baIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ rrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrierIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ _by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable]In file included from 145 | uint32_t data/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: 1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.hwarning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_gro:up(); | 145 ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h::29:15: note: expanded from macro 'barrier_by_group'35 29 | : const i nt w = twarning: hreadIdxunused variable 'flag2' [-Wunused-variable].x/ 145WA | RP_ SIZEu;int3 2\ | ^_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthre) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ ads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uintIn file included from 64_t)) {/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp: 1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h: 13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h| :175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~:498: 29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496| | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here: 13 | MS: CCL_IIn file included from MPL_K/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.hERNEL:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: _ENT/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tidRY_(FUNC_tDEVREiDOP_dTYPE(Su)m, hiIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ ,p_ nbfloat16, false); (| thr^eadId x.x/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | : warp(tid/WARP_SIZE 498384 | :flag3Threa:d((ti d%4)=note: =3), expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE'group (grou p), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | 384 warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 thre | ads( nthr499 eamds), swid(tc | id%Wc ARP_l SIZER ), wu arp(ntsid/ItWAnterpreteepSirze(, 3Proto)LL128,, ful lOpgs>(cormm, aolgo, uwork)p; \ (| ^ group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3t64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, P r499 | o tsteopSi,ze( nc0clS>hme m.cpomrm.biuffmSizses[ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_INCMCL_PPROTLO_L_L12K8]/ENCCRL_SNTEPES/sLize_of(EuinNt6TRY_FUNC_DEVRED4_Ot))P { _ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~T | Y group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.hPE:199:(57Sum, hip_bfloat16, fa: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ lse); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp :3:w1: onote: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here r 3 | kMSCC)L_I;MPL _KE\RNE L_E NT| RY_ ^FUN C_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSize 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ s[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57In file included from In file included from : note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:,13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hIn file included from 1, Proto, 0>:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h: 670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] p rims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 670 | 3 ti | d(tid),M nthreSads(CCL_IMnthreads),In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: :In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h: 175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:warning: 29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] initializer order does not match the declaration order [-Wreorder-ctor] 496 | tid (tid), nthreads670(nthreads), wid(tid | %WARP_ SI tid(tiZE)d, warp)(ti, nthreadd/WARPs_SIZP(L_KEERNn)EL_ENT,RY_FUN C_DtEV REDhOP| _TYrP ~~~~~~~~~~~~~~~~~~E(Suem , hiap _bflod| at16,s stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) false) ); , | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h: 387:4973: tnote: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' | idInBlock( t wahrpI n r387 | B mesccllRaunIontde tcriIdInBkpdlock(rx(thrte.eadhItxdx.rxe)), e, rO_ SIM,P LE]/ | NC), warp(tid/WARP_SIZEPC | rL ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ o_| tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_S t498oT 671E | S | P im pSl/s i efz, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here, m| ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ .buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : ste| warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3CCL_SLICESTEPS, 2>, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ p S499i | z este_pSi)ze(n 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ccl{Shm em. com| m. ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~buf fS ize| s[NCCL_ group(groupPRO TO/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h_LL128]:/NC199CL:_ST57EPS:/siz eonote: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> RepdOpr, FainAsms | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here ymmet3ric | <1,M1>,S 1,C PrCotoL, _0IMPL_KERNEL> p_rimEs N T| ^ R/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cppY_FUNC_DEVREDOP_TYPE(Sum, hip:3_:b1: note: fin instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here l3 | oMSCCaL_ItMPL1_KER6NEL,_EN TRYf_alse); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRFUNuC_DnEVRIEDOnP_TtYPEe(Surm, phipr_bfeloatt16,e fral, ProtoSimple, SProt,oLL 1MSCCL_28S, fLullIOpsCESTEPS, 2>, fullOps>(com>(cmomm,, algao, lworgk);o \ , | ^ work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizeIn file included from s[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | _KE RNEL_ENT RY_FUNC_DsEVREDOP_TtYPE(Sum,e hip_bflopat16, faSlse); | ^iz /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.he(stepSize_ ==:387:3 : note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 3870 | ? ncclShmem.co mscmm.buffSiclRunInzterpreteer, ProtoSimple, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, ProtoL_S,LICES TEPS,0 2>, >fullO ps>(cpomm, ralgo, iworkm); \ s | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h: 670:15: | note: field 'nthreads' will be initialized after field 'tidInBlock' ^670 /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_ | F tUid(tiNd), ntChreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: _DEnote: VREDfield 'group' will be initialized after field 'stepSize'OP_T YPE( Sum, hip_bflo670at16 | , f alse) ; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h :387:tid(tid), n3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, PrototShreiads(nmthrepads)l, tiedInBl, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx942. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx90a. [ 76%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_bf8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx942. 10 warnings generated when compiling for gfx906. In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | cIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ onst int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1,10 warnings generated when compiling for gfx1030. data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, fl/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:a1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.hg:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h2:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h;:75: 7: warning: unused variable 'w' [-Wunused-variable] | 75 | ^~~~~ b/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.harrier_b:y_145g:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1,roup(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hIn file included from :173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h75:7:: warning: unused variable 'w' [-Wunused-variable]13 75 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h: 75 bar:ri7: warning: unused variable 'w' [-Wunused-variable]e r_b y_75 | g roup(b); a | ^~~~~~~~~~~~~~~~~~rrier_by /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:_29:15:g rnote: oup(expanded from macro 'barrier_by_group' 29) | ; | ^~~~~~~~~~~~~~~~~~ co n/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:st int w = t29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | hr ^ead Idx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t dataIn file included from 1, fla/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ g1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp in:t w1 = : thrIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:e173adI: dx/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h.x/:WA75:7: warning: unused variable 'w' [-Wunused-variable] RP _SIZE;75 \ | | ^b aIn file included from rrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ reads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | In file included from stepSize(s/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: tIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:epSize_ == 0 ? ncclShm13: eIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hm:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h.:498c:29: owarning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] m496 | m.tid(tid), nthbuffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)read s(nt:hrea ds),s witd(teid%WpARP_SSIZE)i, wazrp(teid_/WAR) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0P_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), grou> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested hereIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 3 | MSCCLp(g_roupI), M| ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ P | L warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 _499 | K EstRNEL_ENTRY_FUNC_DEVREDOP_TYPeEpSi(ze(SncculShmmem,.co mm.rbufccfSilzes_[NCbCL_PfRloat8, false);OTO _LL 128| ]/N^CCL _ST/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.hEP:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here < 199t | yPripmite>ive,s , 1,2 P>ro,to, 0> fpriums l | ^l /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cppO:p3:1s: >note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here ( 3c | MSCoCL_ImMPLm_K,E algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreaRNEdL_EsNTR(Y_FnUNCt_DEhVrREDeOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | ads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidImsnccBlRlunoIcntker(prtetehrr, oPruotpo(LL1g28r,o fuulplO)ps,>( co mm| , ^~~~~~~~~~~al go, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ Size_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. 10 warnings generated when compiling for gfx90a. [ 76%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f16.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uintIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175In file included from : /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from :/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:80173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; :5:\ warning: unused variable 'w' [-Wunused-variable] 80 | bar rier_| by_gr ^oup(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_gIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ roup(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp21:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: :In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75: 7: warning: unused variable 'w' [-Wunused-variable] warning: 75 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ unused variable 'flag1' [-Wunused-variable] barrie r_by_gr oup(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:14515: note: expanded from macro 'barrier_by_group' 29 | | con st int w uint32_t = threaddIdx.ata1x/WA, flag1,RP_SIZE datIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ a2, flag; \2 | ^ ; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ IZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cppIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ :1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = thIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ readIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 10In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | step warningsS generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1030. ize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | w10 warnings generated when compiling for gfx1200. arpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work);In file included from \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ unc##devredop, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBloIn file included from ck(threadIdx.x), grou/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cppp(g:rou1p),: | In file included from ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: :warning: 670:60initializer order does not match the declaration order [-Wreorder-ctor]: note: field 'group' will be initialized after field 'stepSize' 670 | 670 | tid(titdid()tid,), nthnreatdsh(nthrreaeds)a, tiddInsBl(nthreads), tidInBlock(threadIdx.x), group(gocrk(threadIdx.x), group(group), | ^~~~~~~~~~~ oup), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | 10 warnings generated when compiling for gfx908. stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum,In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x)In file included from , group/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.b(group), | ^~~~~~~~~~~ uffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx90a. [ 76%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f32.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 10 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1030. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | ba/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ rrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13In file included from : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group| ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h(:);145 | ^~~~~~~~~~~~~~~~~~: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_S,I daZtEa2,; fl \ | ^ ag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group( )/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ ; | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ [ 76%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f64.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), groupfalse); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ (group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, manti/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ ssa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | bIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_bayrrier_by__grIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ oupg(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hrIn file included from :29o:15: note: expanded from macro 'barrier_by_group' 29 | con/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ ust int wp = thread(Idx.x/WA)RP_SIZE;; \ | ^ | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARPIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ _SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizesIn file included from [NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:1,13 P: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.hrIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ oto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MS:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ CCL| _IMPL_K stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)ERNEL_E NTRY_FU NC_DEVREDOP_TYPE(Sum, 497double, | false ); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h warpInBlock(threadIdx.x/WARP_S:384:I3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' Z384 | mscEclRunI)nterpre,ter, tiProtoLL128, fullOps>(comm, algo, workd%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128); ]\ | ^ /NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(In file included from thread/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1Idx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffS: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ izes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ In file included from | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13:: 199:57: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hnote: :173: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h : 199 | P670r:15: iwarning: initializer order does not match the declaration order [-Wreorder-ctor] m it670ives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE), (group(Sgroup),u | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ m| tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ ,671 | s tepSizde(steopSize_ u== 0 ?b ncclSlhmem.coemm.buf,fSiz esfalse); [N| CCL_P^ROT O/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h_S:IM387:PL3E:] note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRun/NCCIL_STEPnS/sizetof(T)er :p reter, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | dop, ProtoSimple, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ S, MSCCL_SLICESTEPS, 2>, fullOps>(comm, algo, work); \ | ^ Pri mitives, 1, P:roto,670 0> pr:ims | 15 ^ :/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSnote: CCL_Ifield 'nthreads' will be initialized after field 'tidInBlock'MPL_K ERNEL_ E670 | tid(tid), In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ nNTRY_tFUNhC_DEVRrEDOeP_TaYds(nthPEr(Sum,eads do)ubl, et,i dfalse); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE'InBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ : note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreadIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: sIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3In file included from : note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp>:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:(13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: c/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: owarning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] m496 | mtid(tid),, nthreads(n tahlgo, worreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | k ); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h :670:15:w note: field 'nthreads' will be initialized after field 'tidInBlock' a670 | tird(tid), nthrepaIds(nthreads),nBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock (| warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buthreafdIdx.fx), groupS(group)i, | ^~~~~~~~~~~ zes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 10 warnings generated when compiling for gfx942. 10 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buf10 warnings generated when compiling for gfx1030. fSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for host. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx90a. [ 77%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, :12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 10 warnings generated when compiling for gfx942. 10 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 10 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 10In file included from warnings generated when compiling for gfx1030. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:1: In file included from :/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: 75In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173:: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:757:7: :warning: unused variable 'w' [-Wunused-variable] 75 | warning: unused variable 'w' [-Wunused-variable]barri er_b y_group75( | ) ; | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hb:29:15a: note: rrexpanded from macro 'barrier_by_group' 29 | const inier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ t w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:note: 1expanded from macro 'barrier_by_group': In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h :13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: 29/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75 | :7: warning: unused variable 'w' [-Wunused-variable] 75 | c boIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | baranrrsiIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ ter _byi_grnrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ otup() ; w| = threadIdx.x/WARP_SIZE; \ ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h| :29 ^:15: note: expanded from macro 'barrier_by_group' 29 | const int w = tIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ hrIn file included from eadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | u/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cppi:1: nIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:t13: In file included from 3/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: 2/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145_:14:t warning: unused variable 'data1' [-Wunused-variable] 145 | d a uitnt3a2_t data11, ,fla g1, dafta2, flag2l;a g| 1 ^~~~~, /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.hda:t145:a212:, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h warning: unused variable 'flag1' [-Wunused-variable] : 145145 | : 28 : uinwarning: t32_unused variable 'data2' [-Wunused-variable]t da145ta1 | , f uliag1, datnta32_2t , fdaltag2;a1, fla| ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.hg:1451, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ :28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ ZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ [ 77%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i32.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL1In file included from 28]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNE/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:L13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h_:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] E670 | tNid(tidT), nthreadRs(ntYhread_s), tiFdInBlockUNC_DEVREDO(threadIPdx.x),_ gTrYoPE(Sum, rccl_float8, false); | up(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid)In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ , nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ KSTEPS/MSCCL_SLICESTEPS, MSCCL_SLICESTEP/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' S, 387 | mscclRunInterprete 2>, r, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ s>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENT496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ RY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 10 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ rier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_tIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = thre daata1, flag1, data2d, flag2Idx; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ .x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: In file included from unused variable 'data1' [-Wunused-variable] 145 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | In file included from ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | : tid(ti3d), nthr:eads(nthre1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here ads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warp3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, Ptidr%4)==3o)t,o Simple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(thTEPS/srizeof(euint64a_t)) d{ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ I| group(group d/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199x:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here. 199 | x )Primiti,ves, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ :60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor]In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThr670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEead((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | PrimitivesPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_K, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3:ERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, ProtoLL128, fullOps>(comm, algo, work); \ | ^ ICESTEPS, MSCCL_SLICESTEPS, 2>, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t))In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp :1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeIn file included from of(T) : /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: sIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: t/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] e 670 | p S itze_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:id(57tid), nt:hreads(nt hreadsnote: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, ioup(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ n| tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | t stepSi3ze(stepSi2ze_ == 0 _? ncclSthmem.c,omm.buffS izes[fNCCL_PROaTO_SIMPLEl]/NCCLs_STEPS/sizeeof(T) :) stepSize_); { | ^| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h :387| :3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | msc group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | PrimitivclRunInterpreter, ProtoSimpleanAsy,mmet ric<1,f1>, u1, Prloto, 0l> primsO | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cppp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCsL_IMPL>_KERNE(L_ENTRYc_FUNC_oDEVREDmOm,P algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670_TYPE(Sum, int | 32_t, f alse); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | ms tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), ntchclRunInrterpreeter, tProtoShimple, fuIllOpsnB>(lococmk(threadIdx.x), group(group), m, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:| ^~~~~~~~~~~ 15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. 10 warnings generated when compiling for gfx942. 10 warnings generated when compiling for gfx1102. 1010 warnings generated when compiling for gfx1100. warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx942. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1101. [ 77%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i64.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx90a. [ 77%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, headIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ , mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadId/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | constx.x/WARP_SIZE; \ | ^ int w = t/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:h1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hr:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: ewarning: unused variable 'w' [-Wunused-variable] 75 | a barrierd_by_group(I); | ^~~~~~~~~~~~~~~~~~ d/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: x.x/WARP_SIZE; \expanded from macro 'barrier_by_group' 29 | const | ^ int w = threadIdx.In file included from x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.huint32_:t y, hea13d, man: tissa; In file included from | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_bIn file included from y_g/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:r12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.ho:77:18:up(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h: warning: unused variable 'y' [-Wunused-variable] 2977 | : 15: note: expanded from macro 'barrier_by_group' 29 | c o In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: uintn32_t y,s head/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ t int w = threadIdx.x/WARP_SIZE; \ , mantissa; | ^ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: :13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h::174: 145:14: warning: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:unused variable 'data1' [-Wunused-variable]75:7: 145 | uint32_t dwarning: unused variable 'w' [-Wunused-variable] a75 | tbarrier_ab1, flag1, daty_groupa(); 2| ^~~~~~~~~~~~~~~~~~/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from ,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h: 13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hf:l:75ag2; 29:15: note: expanded from macro 'barrier_by_group' 29 | :7: warning: unused variable 'w' [-Wunused-variable] c 75 | o bansrrtier_ | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] i145nt w = | threadId x.x/WAR P_SIZE; \ | ^ uint32_bty_group( ); | ^~~~~~~~~~~~~~~~~~ d/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: aexpanded from macro 'barrier_by_group' 29 | t consta int w 1= threa,dIdx.x/W ARP_SIZfE; \ | la ^ g1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ , flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | conIn file included from st int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cppIn file included from :1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ :12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ _t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp,:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:f7: warning: unused variable 'w' [-Wunused-variable] l75 | abarrier_by_ggroup(); 2 | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h; | ^~~~~ :29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = thrIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: eadIdx.In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.hIn file included from :145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_b: In file included from y/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: _warning: unused variable 'w' [-Wunused-variable] 80 | g barrrier_by_goroup(); u | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hp:29:15: note: expanded from macro 'barrier_by_group' 29 | c(ons:145):28: twarning: unused variable 'data2' [-Wunused-variable] ; 145 | | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:in15t :w = th r note: e uiexpanded from macro 'barrier_by_group'ant32_ dt dIata1d, flagx1, da.ta2, fx29lag2; / | | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h W:145:35:A warning: unused variable 'flag2' [-Wunused-variable] R 145 | P ui_cnt3S2onst int wIZE; \ | ^ _t data1, flag1, data2, flag2; | ^~~~~ = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZEIn file included from ; \ | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp: ^1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h: 13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175In file included from : /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1), wi: d(tid%In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable]WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ In file included from | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~.x/W ARP_S/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.hIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | : warp(tid/WARP_SIZE 498145 | fl:agThread((tid%4)=21=3), gro:up(gro up), warning: | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3unused variable 'flag1' [-Wunused-variable] 499 | s tepSize145 | uint32(nccl_Shmem.tcom dm.ata1, flag1, dbauffSitzes[NCCaL_PR2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.hOTO_LL128]/:NCCL_145ST:28: warning: unused variable 'data2' [-Wunused-variable]EPS/s iz 145 | uint32_t deof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.hata1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ :199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ DOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | constIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int In file included from w/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:=175: threadIIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ dx.x//builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:W5: warning: unused variable 'w' [-Wunused-variable] A 80 | barrier_by_group(); RP_SIZE; \ | ^ | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t dIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ata1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE NEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter,( nccProtoSimpllShmeem.com, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | PrimiESTEPS, 2>, fulIn file included from lOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthretiaves, d1, PIrotno, 0B> plock(threadIdx.xr)ims , | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cppg:3:1r: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here o up(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 3 | MSC670CL_I | MPL_ KERN EL_E NTRY _FUNtC_DEiVRdED(tid), nthreads(nthOP_TYPE(Sum, int64_t, false); | ^/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp :1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175:: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:3845: warning: :unused variable 'w' [-Wunused-variable] 380 | : barrnote: ierexpanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE'_by_ gro up();384 | ^~~~~~~~~~~~~~~~~~ | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h: 29:15: note: expanded from macro 'barrier_by_group' m29 | cosnst ciclRunInterpretent w = threadIdx.x/WARP_SIZE; \ | ^ reads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ r, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ reter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ threads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ id), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ RY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NIn file included from CCL/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: _In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.hP:498:29: warning: Rfield 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | O tiTO_LL128]/NCCL_STEPS/sizeof(uint64_t)d(ti)d), nthr eads(nt{hreads), wid(tid %WARP| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: ), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~note: | warp(tid/WARP_SIZE expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE'498 | flagT hread((tid384%4)==3) | , grou p(grou p), m | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ scclRunInter| p warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | sterpSizee(nctclShemem.rcomm<.buftfSizyes[NpCCL_ePROT,O_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here Func##devredop, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STIn file included from EPS/sizeof(T) : stepSIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group ize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPnote: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_L_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ IMPL_K/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: EIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173R: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor]N 670 | E tid(tidL), nthrea_ds(nthreaEds), tidINnBlock(thTreadIdx.Rx), groupY(group), _| ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ FUNC_DEVREDOP_TYPE(| tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ S671 | sutepSize(smt, int8_t, false); | ^epSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | PrimitivetidInBlock(threadsI, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ dx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx942. 10 warnings generated when compiling for gfx90a. [ 78%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u32.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx942. 10 warnings generated when compiling for gfx90a. [ 78%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u64.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mant/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ issa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173In file included from : /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h::1375: :In file included from 7/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:: 173warning: : unused variable 'w' [-Wunused-variable]/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h :75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_b y75_ | g r o u p ( )b;a r r| i ^~~~~~~~~~~~~~~~~~e r_by/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h_:g29r:o15u:p (note: )expanded from macro 'barrier_by_group'; | ^~~~~~~~~~~~~~~~~~ 29 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hc:o29n:s15t: inote: nexpanded from macro 'barrier_by_group't w = t29h | r e a d Icdoxn.sxt/ WiAnRtP _wS I=Z Et;h r\e a d| I ^d x.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrieIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ r_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), gr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ oup(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = tIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ hreadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, dataIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from 2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx942. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx90a. [ 78%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx942. 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1102. [ 78%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_bf16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cppIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ :1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, daIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ ta2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uiIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from nt64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:384:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 384 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:199:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 199 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:387:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 387 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:1: In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ x.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16_2, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16_2, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16_4, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16_4, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16_2, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16_2, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16_2, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16_2, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16_2, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16_4, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16_2, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_bf16_2, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_bf16_2, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16_2, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16_2, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16_4, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16_2, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16_4, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16_4, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16_4, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16_4, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16_4, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16_4, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16_4, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx942. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx90a. [ 79%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_bf8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1030. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cppIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: : /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11warning: : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ :80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 10In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8_2, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8_2, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_bf8_2, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8_2, ncIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8_2, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ clFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8_2, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(RedIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8_2, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.huce_RING_SIMPLE_MinMax_bf8_4, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_bf8_2, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8_2, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8_2, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | In file included from stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8_2, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8_2, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8_2, ncclFuncReduce, FuncMinMax, rccl_bfl/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(thoat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ readIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8_4, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8_4, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8_4, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads),/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8_4, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tid tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8_4, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ InBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8_4, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8_4, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8_4, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8_4, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8_4, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. [ 79%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f16.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ :77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] In file included from 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = thrIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cppeadIdx.x/WARP_SIZE; \ | ^ :2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16_2, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_f16_2, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16_2, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16_2, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16_4, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16_2, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16_2, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16_2, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16_2, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_f16_2, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16_4, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16_2, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16_2, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16_4, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ck(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16_2, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16_2, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16_4, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16_4, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, pro/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16_4, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdxto, unroll>().x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ .run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16_4, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16_4, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16_4, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16_4, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16_4, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. 11 warnings generated when compiling for gfx942. 11 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1101. 11 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx908. [ 79%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f32.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp 11 warnings generated when compiling for gfx942. [ 79%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f64.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32In file included from _t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, headIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa;, mantissa; | ^ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARPIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | c_SoIZE; \ | n ^ st int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | cIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ onst int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:29:15: note: expanded from macro 'barrier_by_group' : 29 | 2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | const in t w = thr eadIdx u.x/WARP_SIZEint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, fl; \ | a ^ In file included from g1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | u/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1,int32_t data1, flag1, data2, flag2; | ^~~~~ data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable]In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp: 75 | 2 barr: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: iIn file included from er_by_gr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.ho:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7u:p(); | ^~~~~~~~~~~~~~~~~~ warning: unused variable 'w' [-Wunused-variable] /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h75:29:15: | note: expanded from macro 'barrier_by_group' 29 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp=:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2;In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, dIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ ata2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w =In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | bar threadIdx.x/WARP_SIZE; \ | ^ rier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WAR/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:P_2SIZE; \ : | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | t data1, flag1, data2, flag2; | ^~~~~ barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1,In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] rier_by_75group(); | | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h: 29:15: note: expanded from macro 'barrier_by_group' 29 | c onst in t w = thr eadIdx.x/ WARP_SbIZE; \ | a ^ rrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hdx.x/WA:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ RP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable]In file included from 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from ier_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f32_2, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f32_4, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | In file included from prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f32_2, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f64_2, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tiIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->cd), nthreads(nthreads), tidInBlock(threadIdx.x),onnIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkC group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreadsol(lnthreads), tidInBlock(threadIdx.x), ().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_f32_2, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, worIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f32_2, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ k->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f64_2, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_f32_2, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f32_2, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670\ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nt:15: hreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthrewarning: initializer order does not match the declaration order [-Wreorder-ctor] ads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), gIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | roup(gro up), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ s | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | t stepSize(setepSize_ ==p 0 ? nccSlShmem.comim.buffSizezs[e(stepSizNCCeL_PROTO_ == 0 ? ncclS_SIMhPLE]/NCCL_STmem.coEPS/smm.bizeuoffSif(zT) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.hes[NCCL_PROTO_SIMPL:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tidE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, wo,r nthreads,k &ring->pr-ev, &ring->>next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRingconnIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(Ltid, n>thread(s, workt); | id ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:,432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | n ithreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | f (t id < s if (tid < subtn) Ruubtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:7:1n:Work Collnote: , 1, 2, 2>::run' requested here T, RedO p,7 | D AlEgo, FProtIo, CNOLL_EUNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here _nc7clDe | vFunDc(ReEducFe_RIING_SNIMPLEE__MinMnax_fc32_2c, lDevFunc(Reduce_RING_SIMPLE_nccMlFuincRenduce,M FunacMinxMax,_ flofat, 6NC4_2, ncclFuncReduce, FuncMinMax, doCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, uble, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatchto,, unro ll>(a).runl(); g\ | o ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h,:670:15 : note: proto, unroll>().run()field 'nthreads' will be initialized after field 'tidInBlock' ; 670 | \tid( tid ), n| thre ^ads( n/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid),th reands),t tidhInBlrock(ethreaadIddx.x)s, gr(onthreadup(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), s), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x)In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15:, group(group), | ^~~~~~~~~~~ tid warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:InBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f32_2, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f32_2, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f32_2, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f64_2, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f64_2, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x),/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncc group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f32_2, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ lDevFunc(Reduce_RING_SIMPLE_MinMax_f32_4, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f32_2, n/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncccclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ lShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f64_4, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->conn/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hIndex,:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.he:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f64_4, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ work->connIndex/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] ); | ^ 670 | tid(tid), nthr /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | eads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f32_4, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) Ru tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ n671 | WstepSizeo(stepSirze_ == k0 ? ncclCShmem.coomm.buflfSizes[NlCCL_PRO, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here R33 | e primdOp, Als(tid, nthreads, &ring->prev, &ring-go, Proto, COLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_nc>necxt, wlork->Dsendbeuff,v workF->recuvbuffn, workc->red(OpArgR, 0, ewoduce_RING_SIMPLE_MinMax_f64_4, ncclFuncReducerk->,connI ndex, Fwork->uconnInndex)c; | ^M /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:i63:5: nnote: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63M | arux, double, NCCL_ALGO_RING, NCCL_PROnRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432TO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, pr:78o: note: tin instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here o432 | , u inf (trid o< slubtln) >Run(Wor)kCo.ll(d).rxun(.tidx, s)ubtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f32_4, nc, group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ clFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f32_2, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | pr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f32_4, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(:t33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f64_4, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ id, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(grou5 | DEFpINE_nc)clDevF,unc(R e | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | steducep_RING_SLL128_iMinMaxz_f64_2,e ncclFu(ncRedsuce, FutncMinMeax, doubple, NCSCL_ALGiO_RINGz, NCCLe_PROTO__LL128 , 2) =| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:=611:62: note: 0 ? ncclShexpanded from macro 'DEFINE_ncclDevFunc' m 611 | e m.comRunWorkBatch, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims( redop, algo,t protoi, unrodll>().,run(); \ | n ^ threads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f32_4, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | runRi ng< T, Re dOp, Protos, COLtL_UNReOLL>(ptid, Snthreaids, zworke); | ^( /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hs:432:78:t note: epSize_ == 0 ? nccin instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here l432 | S h if (mtidem.co < subtn) RunWorkColl, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f64_4, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Proto, COLL_UNROLL>().rmum.bun(tid, suffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f32_4, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ &ring->next, work->senbtnd, wobrk);u | f ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cppf:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here , 12 | DEFIwNE_nocclDervFunkc(Re-duce>_RINGr_SIMePLE_cMinMavx_f3b2_4,u nccflFunfcRed,uce, FuncMinMax, float, NCCL_ALGO_RING, NCCLwor_k->rPedOpRArg,O 0, TworkO->co_nnInSdex,I MPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | Rwork->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nutnWorhkBatrch, a lgwo, prooto,r unrkoll>)().r;un() ; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h :670:<15: note: field 'nthreads' will be initialized after field 'tidInBlock' s 670 | u btid(ttid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | n) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_nc tid(clDevFunc(Reducteid_), nRthreIadsN(nthrGeads_), tSidInIBlocMk(thPreadLIdx.Ex), _grouMp(grioup)n, Max_f64_2, nc | ^~~~~~~~~~~ clFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work);In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f64_2, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | R | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f32_4, ncclFuncReduce, FuncMinMaunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ x, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f32_4, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f64_2, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. 10 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f32_4, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | In file included from ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp :2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h :11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h: 173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670 :15: warning: initializer order does not match the declaration order [-Wreorder-ctor]s tepSize(stepSize_ 670 | = ti=d(tid ), nth0re ?ads ncclShmem.com(nmthrea.ds), btidInBulock(ffSithrezes[NCCL_PROadTIdxO.x), _groSIMPuLp(gE]/roup), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stNCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, weopSizer_ == k0 ? n-cclShm>em.cosmm.bueffSiznes[NCdCL_PRbOTO_SIuMPLE]f/NCCL_fSTEPS/,sizeo f(T) : stepSizwe_) { o | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | r group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.hk:33:7:->recvbuff, work-> note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here r 33 | e dprims(Otid, pArg, 0, worknthreads, &ring->prev, &ring->next, work-->con>sendnIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunbWuffo, workr->reckvbuffC, worok->reldOplArg, <0, woFrk->connnInd,ex, wo rk->cTonnIn,dex) ; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here RedOp, Algo, Proto, COLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f64_2, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ _SIMPLE_MinMax_f64_4, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreadIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, ws), tidInBlock(threadIdx.x), groupo(rk); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f64_2, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_f64_2, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f64_4, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f64_4, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f64_2, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f64_4, ncclF/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.huncRe:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor]d 670 | u tidc(tid), enthreads,(nthrea ds), tFidInBlocuk(threncMinMax, adIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreadsNCCL_(PROTO_SInMPLE]/NtCCL_STEPhS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), g, 0| , w ^~~~~~~~~~~ork- >connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f64_4, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f64_4, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx906. 1010 warnings generated when compiling for gfx1201. warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1100. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. 11 warnings generated when compiling for gfx90a. [ 80%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp 11 warnings generated when compiling for gfx942. [ 80%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u32.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, dIn file included from ata2,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11 : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80f:5: warning: unused variable 'w' [-Wunused-variable] l80 | baarrier_bgy_group(2); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h;:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flaIn file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.hg2; | ^~~~~ :11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: barrwarning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ ier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadI/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ dx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barriIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5:er_by_grou warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ p(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uIn file included from int32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2 warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ : warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ , data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: In file included from note: expanded from macro 'barrier_by_group' 29 | const /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hi:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable]n 75 | tbarrier_ w = threadIdx.x/WARPby_group_(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hS:29:15I: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.xZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1,/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, da data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | ta2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145: 21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uuint32_t idata1, fnlag1, datta2, 32_t data1, flag1, data2, flag2; f | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:l28: warning: unused variable 'data2' [-Wunused-variable] 145a | ug2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | int3 2_t data1 , flag1, data2 uint32_t data1, flag1,, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, f data2, flag2; | ^~~~~ lag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: 15/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable]: 80 | barrienote: r_by_groexpanded from macro 'barrier_by_group'up(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h: 29:15: note: expanded from macro 'barrier_by_group' 2929 | c | onst in t w = th readIIn file included from const int w = threadIdx.x/WARP_SIZE;dx .x/WARP_\SIZE; \ | ^ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_tIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable]flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8_2, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8_2, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8_2, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl() .run(tid , subtn, 497 | warpInBlowocrk); k| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp(:12:1: tnote: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12h | DEFINrE_nccleDevFunac(Redudce_RINIG_SIMPdLE_MinxMax_f8._4, ncxclFuncR/educe,W FuncMAinMax,R rccl_Pfloat8_, NCCLS_ALGO_IRING, NZCCL_PREOIn file included from ), T| O_SIMP/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: LIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from E/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:,670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 4670 | )tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncc ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagTh | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ read((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) {lShm em. comm.| buf ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~fSize s[N CCL_| PROT group(groupO_S IMPL/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.hE]/NCCL_STEP:S/si33zeof(:T) 7: s:tepS ize_note: ) in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here{ 33 | prims(t | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing,redO pArgC, 0,O worLk->cLonnI_ndexU, woNrk->RconnIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | OLL> (tid , nth read s, w ork)i; | ^f /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h :432:78(: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested heret 432 | i d if (tid< < s ubtns) RunuWorkbColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReducRunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8_2, ncclFuncReduce, FuncMinMax, rccl_floate_RING_LL128_MinMax_f8_2, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, 8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8_2, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8_4, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8_4, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hwarning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_ST/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here EP S/sizeof(T)63 : st | epSiz e_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33 :7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here r 33 | u prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->cnRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:onnIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8_2, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8_4, ncclFuncReduce, FuncMi nty,M redaop,, a lgor, pcrotco, lunr_oll>f().lruno();a \ t | ^8 , NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthr^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlockead(s),t thidrInBelocak(thdreaIdIddx.xx), .grouxp(gr)oup,), | ^~~~~~~~~~~g roup(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8_4, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | In file included from ste/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from p/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175S: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: ifield 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | z tid(teid), nt(hreads(nsthreatepSds)i, wze_ id(t== 0 ? idn%WARPc_clShmem.comm.buffSizeSIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZs[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArE), | g ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498, | fla gThread0((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(u, work-i>connIndenx, work-t>c64_t))o nnIndex{ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here ); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | 33 | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here p432 | if (tid < subtn) RunWorkCollrims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRin().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMdPOp,L PrEoto_LL1M28,i COLnL_UMNROaLL>x(ti_d, fnt8hre_ads2, w,ork ); n | ^c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hc:432l:78:F note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here u 432n | c R ife (tidd ().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:CCL_5ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto:,1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here u 5n | DErFINoE_nlccllDev>Fun(c(R)edu.ce_rRINuG_LnL12(8_)MinM;ax_ f8_\2, ncc l| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid)Fun,cRe ducne, tFunchMinrMaxe, raccld_flsoat(8,n NCtCL_hreads), tiAdLGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdBxatc.h, ualpgo,( prgotor, uonurolpl>()).ru,n() ; \ | | ^ ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u32_2, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_10 warnings generated when compiling for host. == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8_2, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8_4, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cppi:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8_2, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ze_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPSIn file included from //builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u32_2, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8_4, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15::670: 15: warning: initializer order does not match the declaration order [-Wreorder-ctor] note: 670 | field 'nthreads' will be initialized after field 'tidInBlock' tid(tid), nthreads(nth 670 | tid(tid), nthrreads)e, tidInBalockds(nthreads), tidInBlock(thr(thereadIadx.x)d, groIup(dgroupx.x), group(gr),o | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | u tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671p | stepSize(stepSize_ == 0 ), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBloc? nckclShm(em.cotmm.buhffSirzes[NeCCL_PRaOTO_SdIMPLEI]/NCCLd_STExPS/si.zeof(xT) : ), group(stgepSizre_) {oup), | ^~~~~~~~~~~ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u32_4, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u32_2, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8_2, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8_4, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Red/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u32_4, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), grouce_RING_SIMPLE_MinMax_u32_4, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run();/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8_4, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthurp(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ eads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: buff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8_2, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u32_2, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: x), group(group)initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIM, | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nPtLE_MinMax_u32_2, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ hreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8_4, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u32_2, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u32_2, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL10_PROTO_SIMPLE]/NCCL_STEPS/s warnings generated when compiling for host. In file included from izeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cppt:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11i: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:d498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | < tid( tid), ntshreads(unthreadbs), widt(tid%WAnRP_SIZE)), warp (tid/WARRP_SIZEu), | ~~~~~~~~~~~~~~~~~~ n| stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | W waorpInBlorck(threkadIdx.Coll().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLEad((t_id%4M)==3)i, grounp(groMup), a | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | x warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 _499 | stepSuize(n3cclS2hmem._comm.4buffS,izes[N CCL_PnROTO_cLL128c]/NlCCLFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO__STERPS/siIzeof(Nuint6G4_t)), { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group N/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:C33:7: Cnote: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here L33 | _PROTO_SIMPLE, 4) prims(tid, nthreads, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ &r| ing->p ^rev, &ring/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h->next, work:->s670endbu:ff, w15ork->:recvb uff,note: worfield 'nthreads' will be initialized after field 'tidInBlock'k->re dOpAr g, 0, work670->co | nnInd ex, wo rk->c onnI tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(gronduex)p; | ^) /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:,77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | | runRi ^~~~~~~~~~~~~~~~~ng(ti:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ d, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_u32_2, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), groupPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->c(goroupn), n| ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | I tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ n671 | d steepSizxe(st,epSi ze_ =w= 0 o? ncrclShmkem.c-omm.>buffcSizeos[NCnCL_nPROTOI_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &rinndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl prevP, &rring-o>nextt, woork-,>sen dbufCf, wOork-L>recvLbuff_, woUrk->NredORpArgO, 0,L work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, worL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RIkN); G| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h_:432:S78: note: Iin instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here M432 | P iLf (tiEd < _subMtn) iRunWnoMax_u32_4, ncclFuncReduce, FuncMinMax, uint32rk_Collt().Grun(Otid,_ subRtn, IwNG, NCCL_PROTO_SIMPLE, 4) | ^ ork); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Min/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Max_u32_2, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:n670:t15:h warning: rinitializer order does not match the declaration order [-Wreorder-ctor] e ad670s | ( n ttidh(tird)e, antdhrsea)ds,(n thtreiadds)I, ntiBdIlnBolocckk(t(hrteahdIrdx.ex)a, dIgrdouxp(g.roxup)),, | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~g r | o tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ u 671p | ( g srteopSuizpe()st,ep Si ze| _ ^~~~~~~~~~~== 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ri/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ ==ng->next, work->sendbuff, work->recvbuff, work 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | ->r/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hedOpArg, 0, work->con group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8_4, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:nIndex, work->conn:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | Index); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRingid(InBlotcki(tdhr,ea dIndxt.xh)r,e garodups(g,ro uwork); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIM :P sLtEep_SMizie_)n M{ a | x ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ _ | u group(group 3/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h2:33_:7:2 note: ,in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here n33 | c c l Fpruimns(ctiRd,e ndthrueacdse, ,&r inFg-u>pnrecv,M &irinngM-a>nxex,t, wuorik-n>sten3db2uf_f,t w,or k-N>rCecCvbLuf_f,A wLorGk-O>r_edRING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:OpArg, 0, work->connIndex, work->connIndex); | 611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nth ^ r/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.he:63:5a: note: din instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here s )63 | , truinRdinIgd(tIidd, xnt.hrxea)ds,, wogrkr);o u | p ^ (/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hg:432r:78:o note: uin instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here p )432 | , | if ^~~~~~~~~~~~~~~~~ ( ti/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hd < :su670b:t60n) RunWorkColl().run(ti: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreadsd,( snubttnh, wrorek)a; d | s ^ )/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp,:12 :1t: inote: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested hered InBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u32_4, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u32_2, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIIn file included from M/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_u32_2, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ PLE_MinMax_u32_4, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(thre:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), adIdx.| x), gr ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~oup(gr oup), | ^~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u32_4, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u32_4, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u32_2, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u32_4, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u32_4, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx908. 11 warnings generated when compiling for gfx942. 11 warnings generated when compiling for gfx90a. [ 80%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u64.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ ead, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75173:7: warning: unused variable 'w' [-Wunused-variable] 75: | ba/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hrrier_:75:7: warning: unused variable 'w' [-Wunused-variable] by_ group();75 | | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const i barrier_by_grIn file included from o/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ up(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; nt\ w = thre adIdx.x /WARP_SIZ| E; \ | ^ ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hg:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7r:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ warning: unused variable 'w' [-Wunused-variable] o 75 | ubarrier_bIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ py_gro(up(); | ^~~~~~~~~~~~~~~~~~); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:1529:15: note: expanded from macro 'barrier_by_group': note: expanded from macro 'barrier_by_group' 29 | 29 | c const int w onst in=t w = tIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ hreadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp::2: In file included from 11/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: : unused variable 'w' [-Wunused-variable] 75 | In file included from threa/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h dIdx.x/:bWARP_SI174aZE; : \r | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.hIn file included from :75:7: warning: unused variable 'w' [-Wunused-variable] 75 | rier_ by_group (In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ ); | ^~~~~~~~~~~~~~~~~~ b/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from arri/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.her_by_gr:oup();174 | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:: 29:15: note: expanded from macro 'barrier_by_group' /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h :145:14: warning: unused variable 'data1' [-Wunused-variable] 14529 | co | nst int w cons t int w= = thr eadIdx.x/tWARP_SIhZE; \ | r ^eadI dx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t dIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | atau1, fliag1, ndata2t, fla3g2; 2| ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:_145:35: twarning: unused variable 'flag2' [-Wunused-variable] 145 | data1, flag1, d uiant32_tt daa2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21:ta1, flagwarning: 1, daunused variable 'flag1' [-Wunused-variable]ta2, f lag2; In file included from 145 | | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.hu:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hi:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:n75:7: twarning: unused variable 'w' [-Wunused-variable] 375 | 2_t data1, flag1, data2, fl a g ba2rrier_;by_gr oup( ); | | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ int32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | conIn file included from s/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ t int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29: | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = thre15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ adIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, daIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: ta2,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64_2, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64_2, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64_4, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 11 warnings generated when compiling for gfx90a. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64_4, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64_2, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64_2, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64_2, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_u64_2, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64_2, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64_2, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64_2, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64_2, ncclFuncRIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64_2, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ educe, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_u64_2, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64_4, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64_2, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64_4, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64_4, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffS/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->nexizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64_4, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ t, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64_4, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64_4, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64_4, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64_4, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64_4, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1200. [ 80%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1030. 11 warnings generated when compiling for gfx942. 11 warnings generated when compiling for gfx90a. [ 81%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_bf16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8_2, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8_2, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8_4, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8_4, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8_2, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8_2, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8_2, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8_2, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8_2, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8_2, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_u8_2, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8_4, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8_4, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ _SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8_2, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8_4, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8_4, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_u8_2, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8_2, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8_4, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/siz/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8_4, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ eof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8_2, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8_4, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8_4, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8_4, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, daIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ ta2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16_2, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16_2, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_bf16_2, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16_2, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16_2, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16_4, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16_2, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16_4, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16_2, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16_4, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16_4, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16_2, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16_4, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16_2, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16_4, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16_4, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16_2, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16_4, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16_2, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_bf16_2, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16_2, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16_4, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16_4, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16_4, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx908. 11 warnings generated when compiling for gfx942. 11 warnings generated when compiling for gfx90a. [ 81%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_bf8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_tIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8_2, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | t10 warnings generated when compiling for gfx1100. id(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8_2, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8_2, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8_2, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8_4, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8_2, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8_4, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8_4, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtnIn file included from , w/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ringork); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8_2, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_bf8_2, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8_2, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbu/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8_2, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ty>, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8_2, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx908. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8_4, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_bf8_2, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8_4, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1030. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8_2, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8_2, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8_4, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8_4, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8_4, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8_4, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8_4, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8_4, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. [ 81%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f16.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:In file included from 2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:: 2: In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: :/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14175: warning: unused variable 'data1' [-Wunused-variable] : 145 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h :uint3802_t da:ta1, f5lag1, :dat a2, flwarning: ag2unused variable 'w' [-Wunused-variable] 80 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, 15: note: expanded from macro 'barrier_by_group' 29 | const int w = threaflagd2; I| ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.hd:145:x28: warning: .x/WARP_SIZE; \ | ^ unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_f16_2, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, ntIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16_2, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ hreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16_2, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>(In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nth).run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.reads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? nccx), lgrSoup(ghroupm), e| ^~~~~~~~~~~ m.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16_2, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16_4, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16_4, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSio, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16_2, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ze_ == 0 ? ncclShmem.comm.buffSizes[NCC 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16_2, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ L_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16_4, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16_2, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16_2, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16_2, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16_2, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16_4, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16_4, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16_2, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16_4, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16_4, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16_4, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16_4, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_f16_2, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16_4, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16_2, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16_4, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 11 warnings generated when compiling for gfx942. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx906. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. [ 81%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f32.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ :11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ : warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flIn file included from ag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32_2, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32_2, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32_2, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_f32_2, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32_2, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Proto, COLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32_2, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_f32_2, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINEO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ _ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32_2, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32_2, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32_4, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32_2, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32_2, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32_4, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32_4, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32_4, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32_4, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32_4, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32_4, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->pr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32_4, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32_2, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32_2, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32_4, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32_4, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32_4, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1200. [ 82%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f64.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] issa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7In file included from : warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hIn file included from In file included from :174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ [ 82%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64_2, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64_2, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreadsIn file included from ), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64_2, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64_4, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64_2, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64_2, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64_2, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64_2, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64_4, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%In file included from WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), gr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.houp(group:670:15:) warning: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cppinitializer order does not match the declaration order [-Wreorder-ctor] 670 | , : tid (tid)2, nthre ad: s(In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670| ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stenthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64_4, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthrpSize(encclShmaem.comm.buffdSizes[NCsCL_PROTO_L)L128]/,NCCL tidInBlock(th_STEPS/sirzeofeadIdx.x), group(group)(uin,t64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ : 33| : tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here671 | stepSize(step33 | Sprims(tiid, ze_ == 0 nt?hreads, & ncclShring->pmreev, &rm.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:ing->next,33 work->s:endbuff, w7ork->recvb:uff, work ->redOpAnote: rg, 0, worin instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested herek->connIn dex, work->conn 33 | Index)p; rims(ti| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.hd:77,: nthrea5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here d 77 | s, &ring->prev, &rin rungRingnext,rotoLL128, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64_2, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_f64_2, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64_2, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_nccl/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff,DevFunc(Reduce_RING_SIMPLE_PreMulSum_f64_4, ncclFuncReduce, FuncPreMulSum, work->recvbuff, work->redOpArg, 0, wor k->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64_4, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(s/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] tepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if 670 | tid(tid), (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64_4, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbufIn file included from f, wor/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cppk:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h-:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29:> rwarning: efield 'group' will be initialized after field 'stepSize' [-Wreorder-ctor]c vb uff, work-496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE>redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: ), warp(in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested heretid/WAR P_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_f64_2, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64_4, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64_2, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), grou tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ p(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | In file included from prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclS | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64_2, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , COLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64_4, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64_4, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64_4, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64_4, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barri/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | er_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_bIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ y_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2In file included from , flag/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:22: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ ; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8_2, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8_2, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8_4, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_f8_2, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8_2, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8_2, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (In file included from tid < s/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), groupuIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8_2, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ btn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8_4, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8_2, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSizIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8_2, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(groupe_ == 0 ? ncclShmem.comm.buffSizes), | ^~~~~~~~~~~ [NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8_2, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_f8_2, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8_2, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ NROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8_2, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(grIn file included from oup),/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2 : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:| ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | 173 : /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] stepSize(stepS670 | i tid(tzid), nther_ == 0 eads(nth? renacdcls)Sh, mteimd.InBcloomcmk.(buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8_4, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8_2, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8_4, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8_4, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRin/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hg:670:15<: warning: initializer order does not match the declaration order [-Wreorder-ctor] T 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8_4, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , RedOp, Proto, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8_4, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8_4, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8_4, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8_4, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8_4, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1102. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. [ 82%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u32.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32_2, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32_2, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32_2, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32_2, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32_2, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), gro | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32_4, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ up(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32_4, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_u32_2, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_u32_2, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32_2, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32_2, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32_2, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32_2, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ty>, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32_2, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32_2, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32_4, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32_4, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32_4, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32_4, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor]/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32_4, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32_4, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32_4, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32_4, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32_4, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. 11 warnings generated when compiling for gfx942. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1100. 1010 warnings generated when compiling for gfx1201. warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx908. 11 warnings generated when compiling for gfx942. 11 warnings generated when compiling for gfx90a. [ 82%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u64.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable]In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ ); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flagIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_bIn file included from y/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ _group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ E; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uiIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ nt32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable]In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w =In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barr threadIdx.x/WARP_In file included from SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group();i er_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_SIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeoTEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreaf(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkCollprev, &ring->n Algo, Proto, COLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_u64_2, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ ext, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64_2, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64_2, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PRO/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hTO_S:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor]I 670 | M tid(tid)P, nthreaLds(nthreaEds), tid]/NCCL_SInTBlock(thEPS/sizeof(Tre)adIdx .x), : sgrotepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7:up(g roup), note: | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here671 | st epS 33 | pize(strepSize_ i=ms= 0 ? ncclSh(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff,m em.commw.buffSizeos[NCCL_PrROTO_SkIMPLE]/NC-CL_STE>PS/sizeofr(T) : steepSize_)dOpArg, 0, { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ w | group(groupork->connIndex, wor k/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:-33:7: >note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here c33 | o pnnIndrims(etx); id, n| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.hthrea:ds63:, 5&: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRingprev, L&ring_->next, work->sendbuff, work->recvbUNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here u ff, work-432>redO | pArg, 0, w o if r(k->ctonnInidex, dwork-> connI, ProtoSimple<1, 1, 4>, 4>' requested here ll().run(tid, subtnL>(,tid , nwthroeadrs, kwor)k);; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | | D ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hE:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested hereF I432 | N E _ if (tid < sncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64_2,ubt n) nRuncWorckColllF(L).rGun(Otid_, sRubtIn, NworGk);, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:12:1N: note: Cin instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here CL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc'12 | DE FIN611E_n | ccl De vFun c(R educe_RRINGu_SInMPLWE_PoreMrulSkuBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthrreMuelSuam, duinst64(_t,n NCCL_ALGOt_RIhNG, rNCCeL_PaRdOTOs_SI)MPL,E, 4 ) t | ^i /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hd:611:62: note: Iexpanded from macro 'DEFINE_ncclDevFunc' n611 | B l RuonWocrkBkatc(h,, a lgo , p| rot ^~~~~~~~~~~~~~~~~o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthrea, udnrosll>((n).rtun(h); \r | e ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.ha:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), ds), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64_2, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : ste:60: note: field 'group' will be initialized after field 'stepSize' 670pSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here | tid(tid), nthrea 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64_2, ncclFuncReduce, FuncPreMulSum, uint64_t, NCds(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ CL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64_4, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64_2, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unrIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndeoll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ x, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64_2, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_u64_2, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ :63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().rIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(thrun(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64_2, ncclFeuadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreadncReduce, FuncPreMs, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64_2, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64_2, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64_4, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64_4, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64_4, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlo/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCck(threadIL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64_4, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ dx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64_4, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here In file included from 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64_4, ncclFuncReduce, FuncPreMulSum/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:,2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h: 11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:u173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:i670:15: nwarning: initializer order does not match the declaration order [-Wreorder-ctor] t670 | 6 ti4d(tid_), nthtreads,(nthr eads)N, tidICnBlocCk(thrLeadId_x.x),A groupL(grouGO_RING, NCCL_PROTO_SIMPLE, 4) | p), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_S^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~IMPLE]/NCC L_ST/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hEPS/size:of(670T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work-:>60: cnote: ofield 'group' will be initialized after field 'stepSize' n670 | n Itidn(tid), nthreads(nthreads), tidInBlock(threaddIex,d woxrk-.>coxnnI)n, group(group), | ^~~~~~~~~~~ dex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64_2, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64_4, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64_4, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64_4, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1101. [ 83%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1102. 11 warnings generated when compiling for gfx942. 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ [ 83%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_bf16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t daIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ ta1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u8_2, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u8_2, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u8_2, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u8_4, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u8_4, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u8_2, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u8_2, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/s/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u8_4, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ izeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u8_2, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u8_4, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h498 | flagThread(In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here (tid%4)==3), group(gr:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthr 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432o | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u8_2, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ up), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t))eads) , tidIn{Bloc k(thread Idx.x)| , grou ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~p(group ), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ | 671 | group(groupstep Size(stepSize_ == 0 ? ncclShmem/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h.comm.buffSizes[NCC:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | L_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->: stecpSizeo_) { n | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ n | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.hI:33n:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested hered 33e | x pri,ms(ti d, ntwhreados, &rring->pkrev, -&>ring->nceoxntnIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77,: work5->sen:dbuff , wornote: k->rin instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested hereec v bu77f | f, w runork->rReidOngconnIndexRedOp, ProtoLL128, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl,connI ndex)A;lgo, Pro | t ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:o63:5: note: ,in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | C OrunRiLng(tOid,L nthreads, Lwork);> | ^ (/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78): note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_u8_2, ncclFuncReduce, FuncPreMulSum, uin tT, Re8dOp, _Algo,t Prot,o, COL L_UNNROLCL>C().run(tid, sLubtn,_ work)A; | L ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cppG:12:1:O note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here _12 | DEFRINE_ncIclDevFNunc(RGeduce,_RING _SIMPNLE_PrCeMulSCum_u8_L4, n_cclFuPncRedROTO_LLuce, FuncPreMulSum, uint8_t, NC128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, CpL_ALGrO_RINoG, NCtCL_oPR,OTO_S IMPLuE, n4) | r^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:o611:62l: note: expanded from macro 'DEFINE_ncclDevFunc' l 611> | () . r un(); \ | ^ RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u8_2, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTIn file included from O_S/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11I: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hM:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] P670 | L tidE(tid), ,nthr 2ea)ds (n| t^ hr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.he:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | Rads), tidInBlock(threadIdx.unWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | x ), gro up(gro up), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_t 671 | i sdtepSi(ze(stepSize_ == 0 ? tncclSihmem.cdomm.bu)ffSize,s[NCCL_ PROTO_nSIMPLtE]/hNCCreads(nthreads), tidInBlock(threL_aSTEPS/dsizeofI(T) : dstepSixze_) { . | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ x), group(group), | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15:runRin g(tid, nthr670eads, | work); tid(t| ^i /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432d:78:), nnote: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432threads(nthreads), tidInBlock(threadIdx | . ixf (tid) < s,ub tn) RugnWorkCorll().run(tid, substepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(ttin, wordk); ,| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp: 7:1: nnote: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7t | DEFhINE_ncclDervFunec(Reduace_RING_SIMPLdE_PresMulSum,_u 8_2, n&cclFunrcReducie, FunncPreMulgSum, u-int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE,>prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | 2) | r^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' u611 | n RRunWorikBatchn, ,algo, p roto, uRnroll>e().rdun()O; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:p15: note: field 'nthreads' will be initialized after field 'tidInBlock' ,670 | t id(tiPdr),o tnot,h rCOLL_UNROLL>(teads(nthreads), tidInBlock(thrid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, eadIsdx.x),u groupb(groupt), | ^~~~~~~~~~~~~~~~~n /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h,:670: work);60: note: field 'group' will be initialized after field 'stepSize' 670 | | tid(t ^id), nth/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cppreads(nthreads):, tid12InBl:ock(th1readIdx.x), :grou p(gronote: up), in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here | ^~~~~~~~~~~ 12 | In file included from DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u8_4, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ h671s, altgo, preotpo, uSnroll>i().ruzn()e; \ ( | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hs:670:15t: enote: field 'nthreads' will be initialized after field 'tidInBlock' p670 | S tiid(tid), nthreadsze_ == 0 ? ncclShmem.comm.buf(nthreads), tidInBlock(threadIdx.x), group(grofSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduceup),_ | R ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hI:670:60:N note: field 'group' will be initialized after field 'stepSize' G670 | _ tid(tSid), InthrMeads(PnthreLads),E tidI_nBlPock(trhreadeIdx.x)M, grouup(groulp), S| ^~~~~~~~~~~ um_u8_2, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_u8_2, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u8_2, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u8_4, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u8_4, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PRO: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]TO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx./NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIx), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u8_4, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u8_4, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u8_4, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | In file included from bar/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:r2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:i174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: ewarning: unused variable 'w' [-Wunused-variable] 75 | r ba_rrbiye_rgr_boupy_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | c()o; | n ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15s: note: expanded from macro 'barrier_by_group' t29 | consti int w n=t w threadIdx.x/WARP_SIZE; \ | ^ = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | threadIdx.x/WARP_SIZE; \ | ^ barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16_2, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16_2, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_bf16_2, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16_4, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16_2, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreaIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16_2, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ds(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16_4, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_tIn file included from )) /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: {In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h: 173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670 :15: | warning: initializer order does not match the declaration order [-Wreorder-ctor] ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | 670 | tid(ptid), rnthreadis(nmthreadss(tid, nthreads, ), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepS&ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->conize_ n== 0 ?I ncclSnhmem.cdomm.bueffSizexs[NCCL)_PROTO;_SIMPL E ]/NCCL_S| TEP ^S //builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.hsiz:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runeoRf(T) :i stepSnize_) {g | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ <| T group(group, RedOp, Prot/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &rionLL128,g COLL_-UNROLL>>(tidn, nthreeads, xwork); t | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h, :432:78: note: win instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here o 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:5:1:rk- >sendbnote: uff, win instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested hereork->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthrea d5 | DEsFINE_,ncclDev Func(wReduce_oRING_LrL128_Pkrod)_b;f | ^ 1/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h6_2, :ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 432:61178: note: | in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | i f (t Rid < suubtn) nRunWoWrkoColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16_2, ncclFuncReduce, FuncProd, hip_y, redop, algo, proto, unroll>().run(); \ | ^ bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16_2, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16_2, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16_2, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16_2, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16_2, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCC/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16_4, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ L_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16_4, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16_4, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16_4, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16_4, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16_4, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16_2, ncc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tlFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ id), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, w/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSiork-z>connIndeex); | _ ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h: 63:5: =note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | = runR ing(ntid, nthreads, work); | c ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: cin instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here l S432h | m e m . c oif (tid < subtn) RunWorkColl, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring-o, Pr>oto, nCOLL_eUNROLxL>().tru,n(tid, subtn, work);w | o ^ r/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:12:k1: note: -in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12> | DEFINEs_ncclDevFunc(Reeduce_nRING_dSIMPbLE_Prod_bf16_4, ncclFuncReduce, FuncProd, hip_bfloat16, NCCLuff_, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreadnote: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, ws(ntohreadsr), tidkInBlo)ck(th;r ead Idx| .x), ^group (group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp670 | tid(tid:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here ), nthre12ads | (DEFINE_ncclDevFunc(Reduce_RING_nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ SIMPLE_Prod_bf16_4, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16_4, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1102. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. [ 83%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_bf8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1101. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. [ 83%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f16.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_byIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8_2, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8_2, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8_2, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_bf8_2, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8_2, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8_2, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8_4, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8_2, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_bf8_2, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreanext, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8_4, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ds, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8_2, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8_4, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8_4, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8_2, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group),id), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8_2, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8_2, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8_4, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8_2, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8_4, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8_4, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(gro/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hup), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8_4, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8_4, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8_4, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8_4, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1,In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ : warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | constIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f16_2, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f16_4, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f16_2, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f16_2, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_f16_2, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f16_2, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(ti/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hd, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f16_2, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f16_4, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f16_4, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkCollNpRrOeLvL,> (&)r.irnugn-(>tniedx,t ,s uwbotrnk,- >wsoernkd)b;u f f| , ^ work-/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp>:r7e:c1v:b unote: fin instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested heref , work->r e7dO | DpEAFrIgN,E _0n,c cwloDrek-v>Fcuonncn(IRneddeuxc,e _wRoIrNkG-_S>IcMoPnnLEI_nPdreoxd)_;f 1 6| _ ^2 , ncclFuncRed/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.hu:c63e:,5 :F unote: nin instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested herec Prod, h al63f | , N C CrLu_nARLiGnOg_| (^t id, nt/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hh:r611e:a62d:s ,note: expanded from macro 'DEFINE_ncclDevFunc'w ork); 611| | ^ RunWor/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hk:B432a:t78c:h , 1, 2, 2>::run' requested hereo ll, ty, r432ed | o p < t y >,i fa l(tgiod,

o(r)k.Croulnl(<)F;n ,\ T ,| ^R edOp, /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hA:l670g:o15,: Pnote: rfield 'nthreads' will be initialized after field 'tidInBlock'o to, COL L670_ | U N R O LtLi>d(()ti.dr)un,( tnitdhr,e asdusb(tnn,t hwroerakd)s;), t| i ^d InBlock(/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cppt:h7r:e1a:d Inote: din instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested herex .x), grou p7( | gDrEoFuIpN)E,_ n | c ^~~~~~~~~~~~~~~~~c lDe/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hv:F670u:n60c:( Rnote: efield 'group' will be initialized after field 'stepSize'd uce_RIN G670 | _ S I M PtLiEd_(Ptriodd)_,f 1n6t_h2r,e andcsc(lnFtuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ hreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_f16_2, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f16_4, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f16_2, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f16_2, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f16_2, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f16_4, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f16_2, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f16_4, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f16_4, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f16_4, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f16_4, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f16_4, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f16_4, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1201. 1010 warnings generated when compiling for gfx906. warnings generated when compiling for gfx1030. 11 warnings generated when compiling for gfx942. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. [ 84%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f32.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp 11 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ [ 84%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f64.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174In file included from : /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :75:7In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ : warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32_2, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32_2, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32_2, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32_2, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32_4, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32_2, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_f32_2, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_f32_2, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32_2, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32_4, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' , &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32_4, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32_2, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32_2, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32_4, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32_2, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32_4, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32_2, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>():670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] .run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32_4, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32_4, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ =/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthread= 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32_2, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ s), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32_4, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32_4, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32_4, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32_4, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, dIn file included from ata/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp2:,2 : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] f 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ lag2; In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f64_2, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | : warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nth499reads(nth | reads stepSize(ncclShmem.comm), tidInBlock(thr.eadIdx.xb)u,f fgSriozueps([NCCL_PRgroup), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSiOTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->senze_ == d0 ? ncbclShmem.ucomm.bufffSizes[NCCL_PfROTO_SIM,PLE]/N CCL_STEwPS/sizeoof(T) r: stepkSiz-e_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group >/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33recvbuff, work->redOpAr:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, wog, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | ifrk->s end(buff, twork-i>recvdbuff, work<->red OpArg,s 0, wuork->bconnItndenx, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work);) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128 | ^ _P/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432r:78:o note: din instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here _432 | f 6 if4 (tid_ < s2ubtn,) Ru nWnorkCocll(e).ru,n(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncc FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:lDe62vFun:c(Re ducenote: _RINexpanded from macro 'DEFINE_ncclDevFunc' 611 | G _SIMPLER_uPnroWd_fo64_4r, nkcclBFuantcRedcuh, algo, proto, unroll>().run(); \ | ^ ce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f64_2, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_f64_2, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f64_2, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f64_2, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f64_2, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f64_4, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f64_2, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthrePLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connInads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ dex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, suIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173btn, : work);/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h | ^: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp670:7:1: :note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 715 | DEFINE:_ncclD evFunc(Reducwarning: e_Rinitializer order does not match the declaration order [-Wreorder-ctor]I N G_S670 | tid(tid), nthreads(nthreads),IM PLE_Prtod_f64_i2, nccdlFuncRIeduce, nFuncPrBod, doulbock(threadIdx.x), grle, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' oup(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | 611 | RunWo rkBatc h, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hprims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5:670:: 60:note: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested herefield 'group' will be initialized after field 'stepSize' 670 | tid(tid), nt63hrea | ds(n threa ds), tidI nBrlock(thrueadIdx.x), ngrouRp(grioupn), | g ^~~~~~~~~~~< T, RedOp, Proto, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f64_2, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f64_2, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f64_2, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f64_4, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f64_2, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f64_4, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | prims(tid, nthreads, tid(tid ), nthrea&ds(nthreraing->prev, &ring->next, work-ds), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ >sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); 671 | | ste ^pSize(s tepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PR/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.hOTO_SIMPLE:]/NCCL_63STEPS/s:izeof(T5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing) : s, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, L>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(&tring->iprev,d &ri,ng->next, wo rk->ssendbufuf, worbk->rectvbuff,n work->,redOpA rg, 0,w work->oconnrIndex,k work-)>connIn;dex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63 :5 : | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:12:1: note: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f64_4, ncclFuncReduce, FuncProd, double, NCCL_ALGoO, C_OLL_UNROLRL>(tid, Inthreads, worNk); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:G78: note: ,in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | N iCf C(tid ().run(tid, subtn, woll, ty, redop, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), grourk); | ^ p(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f64_4, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f64_4, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f64_4, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->r/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->pecvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f64_4, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ rev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f64_4, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f64_4, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx906. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. [ 84%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1100. 11 warnings generated when compiling for gfx942. 11 warnings generated when compiling for gfx90a. [ 84%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u32.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' In file included from 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f8_2, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f8_2, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f8_2, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ 33 | prims| (tid, nt tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_hreads, &ring-> prev671, &ri | ng->next, work-> sendbuff, work->r ecvbuffs, twork->reepSizedOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: (stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f8_4, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, u&ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f8_2, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f8_2, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPL/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidIE_Prod_f8_4, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f8_4, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f8_4, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, wIn file included from ork->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here :11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | st432 | if e(tid < subptn) RunSWorkCoill().erunm(tid, s.ubtn, cworok)m; | ^ m/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp.:12:1:b note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested hereu f 12 | DEFINE_ncclDevFunc(RefSdizes[uNCCL_PRcOTO_SIeMPLE]/_NCCL_SRTEPSI/NsGi_zSeIoMPf(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &LEr_Prodi_f8_4, nncclFugncR-educe>, FuncProdn, rccle_floxat8, NtCCL_,ALGO _RING,w NCoCL_PROrTO_SIMPkLE-, 4) | >^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611s:62:e ndbuff, work->recvbuffnote: ,expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unrwoork->reldOpArgl, 0,> work-(>co)nn.Inderxu, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nock(thtreadIdx.x)h, greads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hroup(grou:p), | 432 ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670::60: note: field 'group' will be initialized after field 'stepSize'78 670 | : note: tin instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here id(tid), nthreads(nthreads), tidInBlock432( | t if h(tidr < seubtna) RunWorkColl().run(tid, subtn, work); dIdx.x), gro| u ^p(grou p), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f8_2, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f8_2, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_f8_2, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f8_4, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f8_2, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f8_4, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f8_2, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f8_2, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f8_4, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), groIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor]up(group), | ^~~~~~~~~~~ 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_f8_2, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f8_2, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_P/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads),:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidtInBlocik(thredadIdx.Ix), grnoup(groBup), l| ^~~~~~~~~~~~~~~~~ o/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' c670 | k (tthidr(eatdIdx.x), group(group), | i ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~d), nthread s( nthrea| tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ds ) 671 | stepS,i tidInzBlock(teh(resatepSize_ == dI0dx.x) , grou?p ncclShmem.comm.b(group), u| ^~~~~~~~~~~ ffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f8_4, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f8_4, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f8_4, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = thrIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrieadeIdx.x/WArRP_SIZE_; \ | ^ by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32_2, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32_2, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32_4, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32_2, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32_4, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32_2, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32_2, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32_4, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32_2, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32_2, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32_4, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32_4, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().10r warningusn generated( when compiling for hostt. id, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_u32_2, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32_4, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_u32_2, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(th:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tireadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32_4, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ d), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32_2, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32_2, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32_2, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32_2, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32_4, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32_4, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5 work); : note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32_4, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadId| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32_4, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ x.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx908. 11 warnings generated when compiling for gfx942. 11 warnings generated when compiling for gfx942. 11 warnings generated when compiling for gfx90a. [ 85%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u64.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp 11 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ [ 85%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrieIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ r_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: | ^ warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: :75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 145 | uint32_t data1, flag1, data2, flag2; | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145: ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h14:145:28: warning: unused variable 'data2' [-Wunused-variable] : 145 | u int32_t dwarning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2ata1,; flag 1, d ata2,| flag ^~~~~2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable]: 145 | 145 ui:nt32_21t da:ta1, flag1warning: , datunused variable 'flag1' [-Wunused-variable]a2, flag2; 145 | uint32_t dat| ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = ta1, hflag1r, datea2, falag2;d | ^~~~~ I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:d145:28: xwarning: unused variable 'data2' [-Wunused-variable] 145. | uxint3/2_t daWta1, Aflag1R, datPa2, f_lag2; S | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ IZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp: | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h2:29:15:: note: expanded from macro 'barrier_by_group' In file included from 29 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h co:nst11 int : w =In file included from thr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.headIdx:.x/WA175RP_S: IZE; /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h\ | ^: 80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u64_2, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here In file included from 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u64_2, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunW/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.ho:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:r173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15k: warning: initializer order does not match the declaration order [-Wreorder-ctor] B670 | a tid(ttid), ncthreadhs(nthre, algo, protothreadIdx.x), groIn file included from u/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work-p(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(ste>connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_u64_2, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ pSize_ == 0In file included from ? ncclShm, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hem.comm.:bu670ffS:izes60[NCC:L_P ROTO_note: SIMfield 'group' will be initialized after field 'stepSize'PLE] /NCC L_STEPS670/siz | eof( T) : s tepS ize_t) { i | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~d(tid), nthreads(nthreads) | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | s,t tideInBlopck(tShreadiIdx.zx), egrou(p(grosup),t | ^~~~~~~~~~~e pSize_ == 0 ? ncclShmem.comm.bsendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRingSize(s[NCtCL_PiROTOd_SIMP,LE]/ NCCLn_STEtPS/shizeorf(T) e: staepSidze_)s { ,| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ work); | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->rec| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Revbudff, uworck->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); e_R ING_| SIMP ^LE_P rod/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h_u64_2, :432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | i f (tRidun , algo,_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u64 proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | _2 , nc cltFuincdRed(utcei, dF)unc,Pr odn, tuhintr64e_ta, dNCsCL(_AnLGtO_hRIrNGe, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: aexpanded from macro 'DEFINE_ncclDevFunc'ds ), tid611 | In Bl oc k( thRreunWorkBatch, algo, proto, unroll>().run(); \ | ^ adIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u64_2, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u64_4, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ 5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_u64_2, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u64_2, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, suIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | rbtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u64_2, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u64_2, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ O_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch,unRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u64_2, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work- n>thrreadse(ntchrevadsb), utidfInBflock,(th reawdIdox.xr), kgrou-p(grou>p),r | e ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | d tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ O671 | p A srtg, 0, work->connIndex, work->connIndex); epSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here r o33 | t o prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work-, COLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_>SconInInMdexP); L | ^E /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h_:63P:5:r note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested hereo d63 | _ urun6Rin4gc(tilFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RId, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u64_2, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), grokBatch, algo, proto, unroll>().run()up(group), | ^~~~~~~~~~~ ; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' go, Proto, COLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u64_4, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->p/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hr:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u64_4, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u64_4, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(thIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), readId| x.x), g ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~roup(gr oup), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.c/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(groupomm.)buffS,izes[N CCL _PROT| O_SIM ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~PLE]/ NCCL_ STEPS| /siz tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_eof(T ) : stepSize_)671 { | | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group stepSize(stepSize_ == 0 ? ncclShmem.comm.buf/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.hf:33:S7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here i 33 | z perims(stid, [nthrNeads, C&ringC->prev, &ring->next, work->sendbuff, L_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, wor&k->rrecvbiuff, nworkg->r-edOp>Arg,n 0, ework-x>contnInd,ex, workw->coonnIndrex);k -| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5>: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested heres 63e | n runRdingrecvbuOLL_UNROLL>(tid, nthreads, work); | ^ ff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing, 1, 2, 4>::run' requested here _432 | U iNf (tRidO < sLubtnL) Ru>nWor(kColtl()d.runs(tid,, su btn,w worork); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78k); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, wor_kRING)_SIM;PLE_ Prod_ u64| _4, ^nccl Fun/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cppcReduce, F:uncP7rod,: uin1t64_:t, N CCLnote: _ALGin instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested hereO_ RING , NCCL7_PRO | TO_SDIMPLEE, 4FINE_ncclDevFunc(Reduce_RING_SIMPLE_P) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, prod_u64_2, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ edop, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u64_4, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u64_4, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ p, Proto, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u64_4, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u64_4, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u64_4, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_u8_2, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8_2, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8_2, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8_2, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8_2, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8_4, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8_4, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/N/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, wCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8_2, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ork); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8_4, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads,In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8_4, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthre:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8_2, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: ads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8_2, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8_2, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8_2, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8_4, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_u8_2, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ 10 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8_4, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8_4, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8_2, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8_2, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8_4, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8_4, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8_4, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8_4, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1102. 1010 warnings generated when compiling for gfx906. warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1101. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. [ 85%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_bf16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1030. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | consIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ t int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp :2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:2911: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h | :173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7 : warning: unused variable 'w' [-Wunused-variable] 75 | c boarrnier_sby_gtroup (); i | ^~~~~~~~~~~~~~~~~~ n/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:t15: note: expanded from macro 'barrier_by_group' 29w | con= threadIdx.x/WARP_SIZE; \ | ^ st int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WA | R P bar_rierS_by_IgroupZ()E; | ; ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h :29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145In file included from | uin/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cppt:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h3:11: In file included from 2/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:_174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:t145:14 : warning: unused variable 'data1' [-Wunused-variable]d 145a | t uinat32_1t da,ta1, flagf1, dlag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, afta2,l flaag2; g | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h1:145:21,: warning: unused variable 'flag1' [-Wunused-variable] 145d | auintt32_ta data21, f,lag1 , dafta2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flagIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint3lag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 2_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, daIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ ta2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = th/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flraeadIgdx.x/2WARP;_SIZ E; \ | ^ | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 11 warnings generated when compiling for gfx942. 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, 671work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16_2, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16_2, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBIn file included from lo/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cppc:k2(: tIn file included from h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.hr:e11a: dIn file included from I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hd:175x: ./builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.hx:)498,: 29g:r owarning: ufield 'group' will be initialized after field 'stepSize' [-Wreorder-ctor]p (group), | ^~~~~~~~~~~ 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_bf16_2, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ [ 85%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_bf8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16_2, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16_2, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16_2, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | epSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16_2, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_bf16_2, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16_4, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16_4, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16_2, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16_2, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16_4, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RIN/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSiG, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ zes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:7:1/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16_2, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16_4, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tidkBa(tch, algo, prdoto, unr)oll>().,run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hn:670:15:t note: field 'nthreads' will be initialized after field 'tidInBlock' 670h | tird(tid),e nthreads(ads(nthreads), tidInBlock(threadIdx.x), groupnthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16_4, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34: note: field 'group' will be initialized after field 'stepSize' 7 670 | : tid( tid), note: nthreain instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested hereds(nth reads) , tidInBlock(34thread | Idx.x ), group (group ), | ^~~~~~~~~~~ prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16_2, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16_4, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group10 warnings generated when compiling for host. (group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16_2, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16_4, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16_4, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16_4, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16_4, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16_4, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cppIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ :2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_bf8_2, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf8_2, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_bf8_2, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf8_2, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf8_2, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf8_2, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid),In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScat nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf8_4, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ter_RING_SIMPLE_MinMax_bf8_2, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf8_2, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group)In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here, | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSiIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf8_2, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ zes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34: 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf8_2, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf8_2, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf8_2, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf8_4, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf8_2, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf8_4, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf8_4, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthrea/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf8_4, ncclFuncReds(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf8_4, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ duceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf8_4, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf8_4, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | Run/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf8_4, ncclFuncReduceScatter, FuncMinMax, rccl_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ duceScatter_RING_SIMPLE_MinMax_bf8_4, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run()bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf8_4, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1030. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. [ 86%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f16.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barri barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from er_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARPIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); 11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:_SIZE; \ | ^ 5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, datIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = thread:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | Idx.x/WARP_SIZE; \ | ^ uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28:a2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ rier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16_2, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16_2, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(step/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16_2, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16_4, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16_2, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), groupIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16_2, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_f16_2, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16_2, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16_2, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16_2, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &rIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16_2, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | Ruing->prev, &ring->next, work->sendbuff, work->recvbuff, wnoWrorkk-B>atrcehd>,c oanlngIo,n dperxo,t ow, ournkro-l>lc>o(n)n.Irunnd(e);x )\; | ^ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79n:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_f16_2, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ threads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16_4, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16_2, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16_2, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16_4, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16_4, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16_4, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->rec/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRingredOpArg, 0, work->connIndex, work->connIndo, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:e432x:)78;: note: | in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here ^ 432 | if (tid < subt/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.hn:)65 :R5un:W onote: rkin instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested hereC ollC(O)L.Lr_uUnN(RtOiLdL,> (stuibdt,n ,n twhorreka)d;s , | w ^o rk); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: 12in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here | DEFINE_n c432c | l D e v F un ci(fR (etdiudc en(c)M.irnuMna(xt,i dh,a lsfu,b tNnC,C Lw_oArLkG)O;_ R I| N ^G , NCCL_PROT/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cppO:_12S:I1M:P Lnote: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested hereE , 4) | ^ 12 | DE/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hF:I611N:E62_:n cnote: cexpanded from macro 'DEFINE_ncclDevFunc' lDevFu n611c | ( R e d uRcuenSWcoartktBeart_cRhI6,_ 4a,l gnoc,c lpFruontcoR, eudnurcoelSlc>a(t)t.erru,n (F)u;n c\M i n| M ^a x, half/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h,: 670N:C15C:L note: _field 'nthreads' will be initialized after field 'tidInBlock'A LGO_RING ,670 | N C C L _tPiRdO(TtOi_dS)I,M PnLtEh,r e4a)d s (| n^t hreads),/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h :t611i:d62I:n Bnote: lexpanded from macro 'DEFINE_ncclDevFunc'o ck(thr e611a | d I d x. xR)u,n WgorrokuBpa(tgcrhofield 'group' will be initialized after field 'stepSize', algo, 670p | ro t o , tuindr(otlild>)(,) .nrtuhnr(e)a;d s\( n t| h ^r eads), tidIn/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hBl:o670:c15k:( thnote: rfield 'nthreads' will be initialized after field 'tidInBlock'e adIdx. 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16_4, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16_4, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RI/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInNG, NCCL_PROTO_SIMPLBlE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16_4, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16_4, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. 11 warnings generated when compiling for gfx942. 11 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1200. [ 86%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f32.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdIn file included from x.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ ZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ uint32_t data1, f uinlt32_at dagta1, 1flag,1, d ata2d, flaag2;t | ^~~~~a /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:1452:35:, warning: unused variable 'flag2' [-Wunused-variable] 145 | f luiant32_gt 2data;1, fl ag1 , da| ta2, ^~~~~flag 2; /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h| ^~~~~ :145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1,In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadI d barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ x.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] In file included from 145 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2,In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f32_2, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:n2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.ht:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:h173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:r670:15: ewarning: initializer order does not match the declaration order [-Wreorder-ctor] a670 | d tid(tsid), )nthre,ads(nt hreadts), tiidInBdlock(IthreandIdx.Bx), glroup(ogroupc), | k ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_( 671 | t sthepSizre(steepSize_a ==dIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPL | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeE]/NoCCL_fSTEP(S/sizTeof()T) : ste:pSiz e_) s{ | t ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(groupe /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.hp:34S:7:i note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here z 34 | e _ pri)ms(t id, {nthre ads, &ring- >pre| v, & ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ri | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prevng->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connInde, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRingcon nInPdexr); o | ^t /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.ho:65,:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here C 65 | O L ruLnRi_ngLL_(UNRtOLLi>(tdid, ,nth reands,t wohrk)r; e| ^ a/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:d432:78s: note: ,in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | w o irf (ktid) < subtn) RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7_ | UNDROELLF>(I).NruEn(_tind,c scubltnD,e wvorFk)u; n | ^c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp(:R7:ed1:u note: cin instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here e S7 | DcEFaINtE_tnceclrDe_vFRunIc(NReGdu_ceSScIatter_RING_SIMPLE_MinMax_f32_2, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_MPLE_MinMax_f32_2, ncclFuncReduceScatterSIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f32_2, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f32_4, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f32_4, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f32_4, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f32_2, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_f32_2, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f32_2, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | PsROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hf32_2,: 670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->ncclFuncReduceScatter, FuncMinMax, float, connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f32_4, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f32_2, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 11 warnings generated when compiling for gfx942. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Red/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hu:c670:15e: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | S ca ttid(ttid)e, nthrerads(_ntRhreIadNG_SIMPLE_Mins), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSiMaxz_f3e2_(4, sncctlFuencRpeduSceSicazte_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/ter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here p34 | r o tprioms(,tid , unroll>().run(); \ nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65 :5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f32_4, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^L>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn ,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nth work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFIreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f32_4, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ NE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_f32_2, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f32_2, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f32_2, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(ntnote: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(grouph)reads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f32_2, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCC(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ L_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f32_4, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 86%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f64.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f32_4, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f32_4, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h| ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f32_4, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ : warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from 29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_In file included from by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flaIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ g1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, daIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: tIn file included from a2, fl/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: ag2; | ^~~~~In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h35: :174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.hwarning: unused variable 'flag2' [-Wunused-variable] 145 | : uint3275_t data1,:7: flag1, data2, flag2; | ^~~~~ warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flagIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_f64_2, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64_2, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64_2, ncclFuncReduceScatter, FuncMinMax, double, tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64_2, ncclFuncReduceScatteNCCL_ALGO_rR, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tidIn file included from (/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64_2, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : step/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64_4, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Size_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorIn file included from kColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cppR:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64_2, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ING_SIMPLE_MinMax_f64_2, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64_4, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | work tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevF->sendbuff, work->recvbuff, work->redOpArg, 0, work->connInudnc(ReduceScatter_RING_SIMPLE_MinMax_f64_4, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64_4, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64_4, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64_4, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hIn file included from :/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/siz670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads)eof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here , tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64_2, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64_2, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64_2, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nt note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | hreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64_2, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670 if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceSc:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tatter_RING_LL128_MinMax_f64_2, ncclFuncRedu:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | idR(tid),u nthrneads(ntWhreadso), tidIrnBlock(kthreadIBdx.x), agroup(tgroup)c, | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ h | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671< | sctepSizoe(steplSize_ l== , ty, redop, algo, proto, unroll>()0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSi.run(); \ | ^ ze_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64_4, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64_4, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | r ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(guroup),nRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64_2, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nt | ^~~~~~~~~~~ hreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64_4, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx908. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64_4, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx906. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64_4, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1030. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. [ 86%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp 10 warnings generated when compiling for gfx1030. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const In file included from int w = threadIdx.In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | bax/WARP_SIZE; \ | ^ 2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from rrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint3In file included from 2_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ ag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8_2, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8_2, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8_4, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8_2, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 11 warnings generated when compiling for gfx942. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl(/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:)2: .In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:r11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hu:173: n/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:(15t: warning: iinitializer order does not match the declaration order [-Wreorder-ctor] d670 | , tisd(tuid)b, ntthrnea, work);ds(nthreads), tidInBlock(threadIdx.x), group(group) ,| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp :12:1| : ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEF| INE tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize__nc clD evFunc671(Red | uce Sca tte r_R INGs_SItMPLepSizeE_M(instepSize_ == 0 ?M axn_fc8_c4, nlccSlFhunmcReedmu.cceSocamttmer., bFuffSizes[NuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE,CC L_4PR)OT O_ SIMP| LE^]/ N/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hCCL:_S611TE:PS62/s:iz eonote: f(expanded from macro 'DEFINE_ncclDevFunc'T) : st611ep | Si ze _) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | R un Wo rkpBartcihrepdorpv, ,al go&, rpriotno,g u-n>ronlle>(xt, work-)>.rs10une( warnings generated when compiling for host. n);d \b u| ^f /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hf, work->r:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ecvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8_2, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8_4, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8_2, ncclFuncReduceScatter, FuncMinMax, rccl_float8, /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.NCCL_ALxGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8_4, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8_2, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 87%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u32.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8_4, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8_2, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_f8_2, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8_2, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScattIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(ger_RING_SIMPLE_MinMax_f8_4, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ roup), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8_2, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8_2, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_f8_2, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8_4, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8_2, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (ti&ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | d < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here run 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8_4, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Ring(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8_4, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8_4, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8_4, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ :175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ _t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u32_2, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u32_2, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u32_4, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | primProto, COLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u32_2, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | s(tid, nthreads, &ring->prev, &ring->next, wo^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ rk->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u32_4, ncclFuncReduceScatter, FuncMIn file included from inMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadI/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_u32_2, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) dx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads)| ,^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u32_2, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem. | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | c stepoSize(stmepSize_m == 0 ? .ncclShmbem.commu.buffSizfes[NCCfL_PIn file included from SizROeTO_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:s2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.hS:11[: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173I: N/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15M: Cwarning: initializer order does not match the declaration order [-Wreorder-ctor] PC670 | L_PROTO_LL128]/NCCL_STEPS/sizeofLE(]/NCCLu_STEPS/siizeof(Tn) :t6 step4Size_) _{ tt| id(ti)d) ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~, nt)hr eads( n{ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34| group(group | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h: 34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prim s(tithrdeads),, tidI nBlocnk(thrteadIdxh.x)/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:12:1: note: r, groeup(groaup), d | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | s tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ ,671 | stepS&irinze(stepSize_ == 0 ? pr ims(tnid, nthreads, &ring->prev, &ring->ng->preev, &xringt->ne,xt, w orkwork->sendin instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested hereb 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u32_4, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatchs-end>buff,r weork->crecvvbuff, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , work->redbOuff, pwork->AredOrpArg,g 0ccl,,Shme m .co0mwm.b,ouf frSiwzekos[NCrCL_-kPRO>-TO_c>SIMPcoLE]on/NCnnCL_nISTnEPS/dIsizeenofx(dT),e : sx tep,wSiz oe_) wrork->ck->oconnnInnIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | dex) ; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h :65: 5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here r 65u | n ruRing, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested hereo , COLL_UNROLL34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbufotoLL128, COLL_UNROLL>(tid, nthreads,>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u32_2, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(grou work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tidf, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:7: < subtn) RunWorkColl, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u32_2, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tiedOp, Algo, Proto, COLL_UNROLL>().run(tid, subtn, workp), | ^~~~~~~~~~~ ); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128dInBlock(thre_MinMax_u3adIdx2.x), group(group), | ^~~~~~~~~~~ _2, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), gro/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2u: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from p/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:(15: warning: initializer order does not match the declaration order [-Wreorder-ctor] g670 | tidr(tid), nothreadsu(nthreadps), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~) , tid | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSInBloick(threzadIdx.ex)(ste,p groSize_up(g rou==p) 0 , | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROT? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, wO_SIMoPLE]/NrCCL_STEPkS/size-of(T) >: stepSisze_) { e | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | n group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34d:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here b34 | u prims(tfid, nthfreads, work, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthread->consnIndex,, wor k->cownnIndeox); r| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.hk:65:5:) note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here ; 65 | run Ring<| T, Red ^Op, Pr /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (toto, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) Ruidn < Wsubotn)r RuknWorCkCoolll().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Redp, uAlgco, eProSto,c COaLtL_UtNROeLL>r()._run(RtidI, sNubtn, woGrk)_; S| ^ I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cppM:7P:1: Lnote: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here E 7_ | DEMFINEi_nMax_u32_2, ncclFuncRncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u32_2, ncclFuncReduceScatter, FuncedMuceiScatnterM, Fauncx, uint32_t, NCCMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, protL_AoLGO,_R unroll>I(NG,) NC.CL_rPROuTO_SIMPLnE, (2) )| ^ ;/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h: 611:62\: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | | RunWork ^Bat c/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hh, algo, proto, unrollfield 'nthreads' will be initialized after field 'tidInBlock'> (670 | ) .tidr(tuid)n, n(thr)ead;s(nt hre\ads ), tid| I ^ nB/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tidl(ockt(thireadd), ntIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthhreards(nethraeadds),s ti)dIn,Blo ck(tthrieaddIdxI.x)n, gBroulp(goroucp), k(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u32_2, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hIn file included from :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/siz/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671eof(T | ) : st epSize_ ) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h :34:7: snote: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | t preims(pSize(tids, ntthepSize_ == 0 ? ncreads, c&ring->lIn file included from p/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u32_2, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ revShmem.comm.buffSizes[NCCL_PROTO_, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connInSIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring-d>ex); n | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.he:65:5x: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here t 65 | , ru nRingw_UNROsLendbuffL>(t,id, n twork->recvbuff, wohrreads,k work)-; | ^> /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432r:78:edOpArg, 0, wor note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkCollconnInd ex, wCork->cOonnInLdex);L | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (t_iUNROLdL>(). run<(tid, subtsn, woruk);b | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cppt:12:n1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here) 12 | DEFINE_ncclDevFunc(RReduceuScattner_RIWNG_orkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SISMIMPLEP, 4)L | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hE:611:62_: MinMax_u3note: expanded from macro 'DEFINE_ncclDevFunc' 2 611_ | R2unWor,kBatch , algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), N CCL_nPROtTO_hSIMrPLEe, 2a) d| ^ s/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h(nthreads), tidInBlock(threadIdx.x), gro:u611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | p( ^gro up)/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h, | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h::670670:60: :note: field 'group' will be initialized after field 'stepSize' 15 670: | note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x),tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u32_4, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unrol/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u32_4, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ l>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads),/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(thread tidInBlock(threadIdx.x), groupIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), gr o< subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u32_4, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ up(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u32_4, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u32_4, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | t/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tiid(tidd), nIthreands(nthBreadls), tiodInBclock(tkhread(Idx.xt), grohup(group), | ^~~~~~~~~~~r eadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u32_4, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u32_4, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1200. 11 warnings generated when compiling for gfx942. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. [ 87%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u64.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx1030. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hIn file included from :173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp :2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:warning: 11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:unused variable 'w' [-Wunused-variable]173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrie75r_by_g | ro up( barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ :29:15:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h note: expanded from macro 'barrier_by_group' 29 | : co29nst i:nt w15 = th:readI dxnote: expanded from macro 'barrier_by_group' 29 | co.x/WARP_SnIZE;s t int w = threadIdx.x/WA\ | R ^ P_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:212: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h::11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h: 174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145warning: :14: warning: unused variable 'flag1' [-Wunused-variable]unused variable 'data1' [-Wunused-variable] 145 | u int14532_t | data 1, flag1 , da uint3ta2, f2l_t data1, flag1, data2, flaagg2; 2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h :145:u21: iwarning: unused variable 'flag1' [-Wunused-variable] n 145 | t 3 ui2nt3_2_tt da ta1d, falagt1, adata12, ,fla g2;f | l ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.ha:145:g28: 1, data2, fwarning: lunused variable 'data2' [-Wunused-variable] a145 | g 2uin;t32 _ | ^~~~~t data1, flag1, data2, /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, dflaag2;t | a ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h2:145:35: warning: unused variable 'flag2' [-Wunused-variable], f145 | l auintg32_2t; | ^~~~~ data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barbry_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ ier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 10 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 10 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_tIn file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ data1, fla/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cppg:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 1, da/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ ta2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14 | : warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1,In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ [ 87%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u8.cpp.o In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u64_2, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u64_2, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u64_4, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u64_4, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u64_2, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSiIn file included from ze_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h| :11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h group(group:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.hti:d(tid), nthreads(nthreads), tidInBlock(34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here t65hreadIdx | .x), group (group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | step Size(sterpSize_ ==u 0 ? nccnlShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(TRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u64_2, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u64_2, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u64_4, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /NCCL_ST E670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u64_4, nPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work-c>clFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u64_4, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn,In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work work); | ^ ->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u64_2, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_u64_2, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, In file included from nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h :11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:43215: warning: initializer order does not match the declaration order [-Wreorder-ctor] | 670 | tid (tid if (tid < subtn) RunWo), nthreads(nthreads), tidInBlock(threadIdrkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScattexr.x), g_roup(gRroup), I | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_N 671 | G st_epSize(SIMPLE_MinMastepSxize__ == u0 ? n6cclSh4mem.c_omm.b2uffSi,zes[N CCL_PnROTO_SIcMPLE]c/NCCLl_STEPFS/sizeof(T) : ustepSizne_) { c | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ R| educeScatter, Fun group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | pricMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); m\s(ti | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' d, nthread670s, & | ring ->pr ev, & ring ->netxt, iworkd->s(endbutff, iworkd->rec)vbuf,f, w ork->nredtOpArgh, 0,r worek->caonnIdndexs, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(60tid,: nth reanote: ds, field 'group' will be initialized after field 'stepSize'work ); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432670:78: note: | in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | tid(tid), nthreads(nthreads), t i d iIf n(tBidl ( ). r| ^~~~~~~~~~~ un(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u64_2, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173\ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(ti: d/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (ReduceScatter_RING_SIMPLE_MinMax_u64_2, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_u64_2, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ 10 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &rinIn file included from g->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(ti/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hd, nthreads/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u64_2, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceS(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/catter_RING_SIMPLE_MinMax_u64_4, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4sizeof)(T) : stepS ize_) {| | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ ^| group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h :34:7:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | :prims(611tid, n:thread62s,: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | R &ring->prev, &ringIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u64_2, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(ti->next, work->sendbuff, work->recvbuff, work-unWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(thr>reedOpArga, 0, wodrk->coIndx.x), grnIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | oup(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u64_4, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u64_4, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hnote: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u64_4, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u64_4, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u64_4, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBa(threadIdx.x), group(group), | ^~~~~~~~~~~ tch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h::75:7: warning: unused variable 'w' [-Wunused-variable]2: In file included from 75 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h barrie:r_by_grou11p(); | ^~~~~~~~~~~~~~~~~~ : /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: In file included from note: expanded from macro 'barrier_by_group' 29 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h const in:t w 173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: = twarning: hreadIdx.unused variable 'w' [-Wunused-variable]x/WAR 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | constP_SIZE; \ | ^ int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:In file included from 15: note: expanded from macro 'barrier_by_group' 29 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h : const int w174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75 :7: warning: unused variable 'w' [-Wunused-variable]= 75 threadIdx.x/WARP | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int _SIZE; \ | ^ w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uIn file included from int32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: 145 | uin warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ t32_t data1, flag1,In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, f data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ lag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flaIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ g1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8_2, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8_2, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8_2, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_u8_2, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8_2, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8_4, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), gro_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8_2, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ up(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8_2, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ id < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8_4, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8_2, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ reads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ >().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8_4, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8_4, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , redop, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8_2, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8_4, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8_2, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_u8_2, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8_4, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8_2, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid),/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthr nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8_4, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ eads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8_4, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8_4, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8_4, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0,lock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group) work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8_2, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8_4, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1100. 11 warnings generated when compiling for gfx942. 11 warnings generated when compiling for gfx90a. [ 87%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 10 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const , fint w = threadIdx.x/WARP_SIZE; \ | ^ lag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ ag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16_2, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16_4, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_bf16_2, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16_2, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16_2, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_bf16_2, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16_2, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16_2, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16_2, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16_2, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16_4, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16_2, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16_2, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16_4, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkC/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSizeoll().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16_4, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ _ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16_4, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16_4, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16_2, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16_4, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. [ 87%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16_2, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16_4, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16_4, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16_4, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16_4, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, In file included from head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:In file included from 2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h::173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:7511:: In file included from 7/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: : warning: unused variable 'w' [-Wunused-variable] /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75 :75 | 7: barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int wIn file included from = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp::145:235: :In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.hwarning: :unused variable 'flag2' [-Wunused-variable]11 : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h: 174145: | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h : 145 :u14in:t warning: 3unused variable 'data1' [-Wunused-variable]2 _t data1, flag 1145, | d a t a 2u,i nftl3ag22_;t d| a ^~~~~t a1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_gr ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11oup(: ); In file included from | ^~~~~~~~~~~~~~~~~~/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29::15: note: expanded from macro 'barrier_by_group' 29 | 174 const: int/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h w = th:readId75x.x/WARP_In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); :7: | ^~~~~~~~~~~~~~~~~~ warning: S/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const unused variable 'w' [-Wunused-variable]IZE; int w = threadIdx.x/WARP_SIZE; \ | ^ 75 | \ | ^ barrier_by_ group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uinint32_t32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8_2, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611In file included from | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadI/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8_2, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ dx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8_2, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8_2, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_bf8_2, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_bf8_2, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8_4, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8_4, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8_2, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8_2, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8_2, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8_2, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8_2, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRin/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8_4, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Algo, Proto, COLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8_4, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8_2, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8_4, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8_2, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8_4, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8_4, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8_4, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8_4, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8_4, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8_4, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1100. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. [ 88%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f16.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cppIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ :2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16_2, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16_2, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16_2, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16_2, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16_2, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16_4, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_f16_2, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16_2, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16_4, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16_2, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16_4, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16_4, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16_4, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16_4, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16_4, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_f16_2, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16_2, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16_2, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16_2, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16_2, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16_4, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16_4, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16_4, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16_4, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 11 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx908. 1010 warnings generated when compiling for gfx1100. warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1201. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. [ 88%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f32.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx908. [ 88%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f64.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_f32_2, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32_2, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32_2, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32_4, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32_2, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32_2, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32_2, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32_2, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, prIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32_2, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_f32_2, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ oto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32_4, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreaIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, wods(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32_2, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173rk->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32_2, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ : /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32_2, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32_2, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32_4, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32_4, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32_4, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32_4, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32_4, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32_4, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32_4, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h10 warnings generated when compiling for host. :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32_4, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32_4, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64_2, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64_2, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64_4, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64_4, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64_2, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64_2, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_f64_2, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64_2, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64_2, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64_2, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64_2, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64_2, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_f64_2, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64_2, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64_2, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64_4, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64_4, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64_4, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64_4, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64_4, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64_4, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64_4, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64_4, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64_4, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1200. 11 warnings generated when compiling for gfx942. 11 warnings generated when compiling for gfx90a. [ 88%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx906. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. [ 89%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u32.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const iIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ nt w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, d/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.ha:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174t: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uaint32_t dat2a1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ , flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h::175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: 5unused variable 'w' [-Wunused-variable] 80 | : barrie rwarning: unused variable 'w' [-Wunused-variable] 80 | barr_iby_group(e); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hr_:29by_group(); | ^~~~~~~~~~~~~~~~~~:15: note: expanded from macro 'barrier_by_group' 29 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' const int w = threadIdx.x29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = thIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cppreadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ :174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: :2: warning: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:unused variable 'data1' [-Wunused-variable]174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_b y_group() ; | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, dat/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ a2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ : /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | co/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ nst int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, fIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ lag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_f8_2, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8_2, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8_2, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8_2, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8_2, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8_4, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8_2, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthrea/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hds(nth:670:15:r warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | e tid(tid), anthreads(nthdreads), tidsInB), tidInBlock(threadIdx.xlock(threa)dIdx.x), grou,p(group) ,g r o| up(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | step| tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSizSeize(stepSiz_e_ == 0 ? n)cclShmem.c omm.buffS{izes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8_4, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8_4, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8_4, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8_2, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8_2, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8_2, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff,In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8_2, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), grou_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_f8_2, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ p(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIn file included from Index, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlo65:5c: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | k runRing<(T, RedOp, Ptroto, COLL_hUNROLL>(tidr, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.he:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested herea 432 | d iIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~f (t id < subtn) RunWorkCo| ll().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:12::1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 34 12 | DE:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8_2, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ FINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8_4, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8_2, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ Arg, 0, work->coIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ nnIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8_4, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8_4, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8_4, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8_4, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8_4, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8_4, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = thIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIreadIdZx.x/WARPE_SIZE; ;\ | ^ \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | coIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ nst int w = /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const inthreadIdx.x/WARP_SIZE; \ | ^ t w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' In file included from 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ _t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, fIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ lag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hint32_t :data1,29 flag1,: data2,15 flag2:; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h :145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_note: t dataexpanded from macro 'barrier_by_group' 29 | const int w = thre1, aflag1, ddata2, Iflag2; d| ^~~~~ x.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_In file included from SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable]In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32_2, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_u32_2, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32_2, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:In file included from 12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevF/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: unc(ReduceScatter_RING_SIMPLE_PreMulSum_u32_4, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: note: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hexpanded from macro 'DEFINE_ncclDevFunc':670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid611), nth | reads (nthrea ds), ti dInBlo ck(thRreadIdxu.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | n tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | W steopSize(rstepSkize_ =B= 0 ? ancclShtmch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlockP(LE]/NCtCL_STEhPS/sizreadIdx.x), group(geof(Tr) : stoepSizeu_) { | p ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h):34:,7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h prims(tid, n:thread670s, &:ring->60prev, &ring-:>ne xt, wonote: rk->senfield 'group' will be initialized after field 'stepSize'db 670 | uff, work-t>id(tid),recvbuff, work->redOpArg, 0, wo nthreads(nthreads), tidInBlock(threadIdx.x), group(groupr)k->,conn Inde x| , wo ^~~~~~~~~~~rk-> connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32_2, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32_2, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32_4, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32_4, ncclFuncReduceScatter, FuncPreMulSuIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->m, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads),connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32_2, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32_2, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32_2, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWork/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmeBatcmh, almgo, pr.oto, bunrolul>().frun()f; \ S| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hi:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' z670 | e tis[NCCL_PROTO_Sd(tIid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tidMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->conn(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Index, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32_4, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32_2, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_u32_2, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32_2, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32_4, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32_2, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32_4, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32_4, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32_4, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32_4, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32_4, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32_2, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32_4, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1201. 11 warnings generated when compiling for gfx942. 11 warnings generated when compiling for gfx90a. [ 89%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u64.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ : /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7:: 29warning: :15unused variable 'w' [-Wunused-variable]: note: expanded from macro 'barrier_by_group' 29 | 75 | c o n sbta rirnite rw_ b=y _tghrroeuapd(I)d;x . x| / ^~~~~~~~~~~~~~~~~~W ARP_S/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hI:Z29E:;15 :\ note: expanded from macro 'barrier_by_group'| ^ 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uintIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64_2, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64_2, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64_2, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64_2, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64_4, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64_4, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64_2, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64_4, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threa dI670d | x. x ) ,t igdr(otuipd()g,r onutph)r,e a d| ^~~~~~~~~~~s (nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64_4, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64_2, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64_2, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_u64_2, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64_2, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_u64_2, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64_2, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64_4, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64_2, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64_4, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64_4, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64_2, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64_4, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64_4, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64_4, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64_4, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 11 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1030. 11 warnings generated when compiling for gfx942. 11 warnings generated when compiling for gfx90a. [ 89%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1100. [ 89%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_bf16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WAIn file included from RP/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp_:S2I: ZIn file included from E/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h;: \11 : In file included from | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h ^: 174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8_2, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8_2, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8_4, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_u8_2, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8_2, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8_2, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8_2, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8_2, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8_2, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8_2, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8_4, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8_2, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8_4, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8_4, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8_4, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(groupIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_u8_2, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8_4, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , Proto, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8_2, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8_4, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWork:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8_4, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8_2, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Batch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8_4, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8_4, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8_4, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_bf16_2, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16_2, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16_2, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16_2, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16_2, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_bf16_2, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16_4, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16_2, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:: 2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16_2, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadId:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | x. x), group (group), | tid(tid), nthreads(nthre ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSiads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) zes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->re{ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, workcvbu-ff, w>ork-r>redOepArg,c 0, vwork-b>connuIndex,f workf->con,nInde x); | w ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:o65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested herer k->redOpArg, 0, work->connIndex, work->connInd 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: ex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkCollnote: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here< 432F | n if, (ti d T< sub,tn) RunRWorkeColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reducelgo, Proto, COLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16_4, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Scatter_RING_SIMPLE_Prod_bf16_2, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16_4, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16_4, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16_2, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16_2, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(th:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ readIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16_4, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkCol/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hl:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | ().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16_4, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62 runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16_4, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ : note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreaIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16_2, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ds), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16_2, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16_4, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16_4, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16_4, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16_4, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1030. 11 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1100. 11 warnings generated when compiling for gfx942. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1101. [ 90%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_bf8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp 10 warnings generated when compiling for gfx908. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. [ 90%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f16.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8_2, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8_2, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8_4, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8_4, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8_2, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8_2, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8_2, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8_2, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_bf8_2, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 10 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.commIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8_2, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8_2, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCC2L_A;L GO _| R ^~~~~I NG, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8_4, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8_4, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8_4, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8_4, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_bf8_2, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8_2, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8_2, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8_2, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8_4, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8_4, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8_4, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8_4, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8_4, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16_2, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16_2, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16_4, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:7:1: note: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16_2, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16_4, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16_2, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16_2, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16_2, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16_2, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16_2, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_f16_2, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16_4, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16_2, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16_4, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16_4, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16_4, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16_4, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_f16_2, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16_4, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16_2, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_ProIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_d_f16_4, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16_2, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16_4, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16_4, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthrea(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ds(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1030. 1010 warnings generated when compiling for gfx1100. warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx906. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. [ 90%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f32.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp 11 warnings generated when compiling for gfx942. 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group();In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ rier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ :7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_grouIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ p(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ ; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable]In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZ barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ E; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] _ 75 | b barriery_by_group_(); | ^~~~~~~~~~~~~~~~~~ g/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: rnote: expanded from macro 'barrier_by_group' 29 | o const intu w = threpadIdx.x/(WARP_SI)ZIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7:; E; | ^~~~~~~~~~~~~~~~~~ \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = thre warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ adIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32_2, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32_2, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | run /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Ring(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32_2, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkCollwarning: ()field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor]. run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32_2, ncclFun c496R | e d u cteiSdc(atitdt)e, rn,t hrFeuandsc(Pnrtohrde,a dsf)l,o awitd,( tiNdC%CWL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_f32_2, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_f32_2, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSizeIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | t(istepSdize_ =(= 0 ?t nciclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ d)| , nthread group(groups(nth reads), tidIn/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32_2, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Block(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32_2, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid10(tid) warning, nthrseads( generatednthreads), tidInBlock(threadIdx.x), group(group), 10 warnings generated when compiling for gfx1200. | ^~~~~~~~~~~ when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32_2, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32_2, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1030. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32_2, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32_4, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32_4, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32_4, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32_4, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32_4, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32_2, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32_4, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32_4, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32_4, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32_4, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 90%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f64.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32_2, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32_4, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32_4, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14:: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_guirnt32_t daota1, flag1u, data2p, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable]( 145 | )uint32_t d;ata1, f lag1, | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int data2w, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28=: warning: unused variable 'data2' [-Wunused-variable] 145 | t h r euadIdx.x/int32_Wt dIn file included from ARP_SIZE; ata1\, fla/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cppg:2 1 ,| ^: d ata2, flag2; In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.xIn file included from / | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1,WARP_SIZE; \ | ^ flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t daIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ ta1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_tint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ WARP_SIZE; \ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64_2, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64_2, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64_4, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64_4, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64_2, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64_2, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64_2, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64_4, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64_2, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto,:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.com unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ m.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64_4, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64_4, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tidIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64_2, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ %4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_f64_2, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64_2, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64_4, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64_4, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64_4, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64_2, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_f64_2, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64_2, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64_2, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64_4, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1102. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64_4, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RI/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64_4, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), NG, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ nthreads/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h(:670:15:n note: field 'nthreads' will be initialized after field 'tidInBlock' t670 | hreads tid(tid), ), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreadsnthr)eads(nthreads), ti,dInB lock(threadtIdx.xi), gdrouIp(groupn), Blo | ^~~~~~~~~~~~~~~~~ c/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:k60: (note: field 'group' will be initialized after field 'stepSize' t670 | h tird(tid)e, nthareadds(nthIrdex.x), group(group), | ^~~~~~~~~~~ ads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1030. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. [ 91%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from 10 warnings generated when compiling for gfx1102. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10In file included from warnings generated when compiling for gfx1101. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_grouIn file included from p(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t dIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ ata1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ , data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h: uint3229:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ _t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8_2, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8_2, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_f8_2, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSiIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8_2, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ze(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, wor/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (k); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8_2, ncclFuncReduceScatter, FuncProtdid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8_4, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8_2, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 11 warnings generated when compiling for gfx942. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8_4, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8_4, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. [ 91%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u32.cpp.o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:/usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u32.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp 670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8_4, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8_4, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreaIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ds(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8_2, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_f8_2, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8_2, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8_2, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group)In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | , | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_ST group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8_2, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ EPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_nc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8_2, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611::67062:15: :warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | note: tidexpanded from macro 'DEFINE_ncclDevFunc'(tid ), nthreads611(nth | re RunWorkBatch, aelgo,p protSo, iunrozll>(e).ru(n(); s\ tepSi| ^z /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.he:670_ == 0 ? ncclShm:15:e note: field 'nthreads' will be initialized after field 'tidInBlock' m 670 | . ctid(otidmm.b)u, ntfhfSizeresads([nNCCL_thPreaRds)O,T tO_SIMPLE]/idInBlock(threadIdx.x), group(group)NC,CL_ ST EPS| /si ^~~~~~~~~~~~~~~~~zeo f(T/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h) : st:epS670ize:_) {60 : note: field 'group' will be initialized after field 'stepSize' | 670 ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h :34 tid(t:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here id), nth34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbufrfead,s(n threwadso), rtikdIn-Blo>ck(rthreeadcIdxv.bx),u grofup(fgroup), | ^~~~~~~~~~~ , work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8_4, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().ruIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8_2, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ n(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nt/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8_4, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ hreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8_4, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.ho:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8_4, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8_4, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8_4, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32_2, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32_4, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCLIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_)_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvb { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32_2, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^uff, work->redOpArg, 0, work->connIn d/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32_2, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32_2, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32_2, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32_4, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_SIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32_2, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ TEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32_4, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().ru/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32_4, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ n(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32_4, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32_2, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here ING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_u32_2, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_u32_2, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32_2, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32_2, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32_2, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32_4, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32_4, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32_4, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32_4, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING,ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->conn NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Index); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRi/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32_4, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ng(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32_2, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32_4, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 11 warnings generated when compiling for gfx942. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx906. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. [ 91%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u64.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1100. [ 91%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZEIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ ; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64_2, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64_2, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64_2, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ oll, ty, redop, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64_2, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64_2, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64_4, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64_4, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64_4, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64_4, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64_4, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64_2, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64_2, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthrIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64_2, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ eads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_u64_2, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_u64_2, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64_2, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64_2, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64_4, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64_4, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64_4, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64_2, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64_4, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64_4, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64_4, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t In file included from data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_u8_2, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8_2, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8_2, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8_2, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8_2, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8_2, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8_2, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8_2, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8_4, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8_2, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_u8_2, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8_4, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: In file included from field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8_2, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8_4, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8_4, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] >().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8_2, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8_2, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8_4, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8_4, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8_4, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8_4, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8_4, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8_4, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8_4, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1030. 11 warnings generated when compiling for gfx942. 11 warnings generated when compiling for gfx90a. [ 92%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_bf16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1101. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. [ 92%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_bf8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1,In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t daftla1a,g 1f,la gd1a,t ad2a,t af2,la fgl2a;g 2 ; | ^~~~~| ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h3:2_145t: 21d:a tawarning: 1unused variable 'flag1' [-Wunused-variable], flag1, d a145t | a 2 , f luaign2;t 3 2| _ ^~~~~ t /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.hd:a145t:a35:1 ,warning: unused variable 'flag2' [-Wunused-variable]f lag1 ,145 | d a t aui2n,t 3f2_lta gd2a;t a 1| , ^~~~~f lag1/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h,: d145a:ta282:, warning: flunused variable 'data2' [-Wunused-variable]a g2; | ^~~~~ 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16_2, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16_4, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16_2, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_bf16_2, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_bf16_2, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16_2, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16_2, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16_2, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, w10 warnings generated when compiling for host. ork); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16_4, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16_2, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16_2, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16_2, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16_2, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16_4, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16_4, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tidl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16_4, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16_2, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16_2, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16_4, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16_4, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16_4, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16_4, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16_4, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16_4, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | In file included from uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8_2, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_bf8_2, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8_2, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8_2, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8_4, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8_4, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_bf8_2, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ , T, RedOp, Algo, Proto, COLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8_2, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8_4, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8_2, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8_2, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8_2, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8_2, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8_2, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8_2, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8_4, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8_4, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8_4, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8_4, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8_4, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8_4, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8_2, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8_4, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8_4, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx908. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. [ 92%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f16.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_f16_2, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16_2, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16_2, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16_2, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16_4, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16_4, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16_2, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16_2, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16_4, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16_2, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16_2, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16_4, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16_4, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_f16_2, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16_2, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16_2, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16_2, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) Run/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:WorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16_2, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16_4, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(g/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hrou:p670):,15 : | warning: ^~~~~~~~~~~~~~~~~ initializer order does not match the declaration order [-Wreorder-ctor] /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670670 | | ttiidd((ttiidd)),, nntthhrreeaaddss((nntthhrreeaaddss)),, ttiiddIInnBBlloocckk((tthhrreeaaddIIddxx..xx)),, ggrroouupp((ggrroouupp)),, | | ^~~~~~~~~~~ ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16_4, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16_4, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthrea().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16_4, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ds), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16_4, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16_4, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1100. [ 92%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f32.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1030. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 10 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 10 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:In file included from 7: warning: unused variable 'w' [-Wunused-variable] 75 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2 : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:barrier_by_grou75:p7: warning: unused variable 'w' [-Wunused-variable] (75 | ) ; | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h: barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 10 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uinIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ t32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from 10/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | cons21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ t int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 10 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32_2, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32_2, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32_2, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32_2, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32_2, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScat/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32_4, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32_4, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algoter_RING_SIMPLE_Sum_f32_2, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, workIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(ti->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32_2, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ d), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_f32_2, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32_4, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32_2, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32_2, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32_4, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32_2, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_f32_2, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32_4, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32_4, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32_2, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32_4, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32_4, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32_4, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32_4, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 93%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f64.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp 10 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32_4, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cppIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64_2, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64_4, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64_2, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64_2, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64_2, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64_4, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64_2, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64_4, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64_4, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64_2, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_f64_2, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ 10 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64_4, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64_2, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64_4, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64_4, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64_2, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_f64_2, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64_2, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(thrIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64_2, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ eadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64_2, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64_4, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(gr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threaoup), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work);dIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64_4, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64_4, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1030. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64_4, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1102. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. [ 93%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp 10In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; warnings generated when compiling for gfx1102. | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ :12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1030. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 10 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | coIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28:nst int warning: w = unused variable 'data2' [-Wunused-variable]thr eadI dx.x/WA145RP_SI | ZE; \ | ^ uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIn file included from Idx.x/WAR/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2P: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11_: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173S: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:I7: warning: unused variable 'w' [-Wunused-variable] Z 75 | E ;In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:barri er_by175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ _group(\); | | ^ ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f8_2, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | Run/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f8_2, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ WorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_f8_2, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f8_4, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBloty, redop, algo, proto, unroll>().run(); \ | ^ ck(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nth/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f8_4, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ reads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f8_2, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:In file included from 60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_f8_2, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f8_2, ncclFuncReduceScatter, FunIn file included from cSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(thread/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid),I dx.x), group(group), | ^~~~~~~~~~~ nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f8_2, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(roll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tnithreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f8_2, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ d(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads 670 | tid(t)i, tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f8_2, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ d), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 11 warnings generated when compiling for gfx942. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_In file included from f8_4, ncclFun/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ =cReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unr= 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34oll>:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f8_2, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f8_2, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f8_4, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f8_4, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_< subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f8_4, ncclFuncReducRING_SIMPLE_Sum_f8_4, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ eScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.htidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f8_4, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 93%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u32.cpp.o In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? nc/usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u32.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp clShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f8_2, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f8_4, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work-In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : s>recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRitepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SUNROLL>(tid, nthreads, work); | ^u m_f8_2, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f8_4, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f8_4, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx uint3.2_t data1x, flag1,/ data2W, flag2;A | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145R:21: warning: unused variable 'flag1' [-Wunused-variable] P 145 | u_int32_tS data1, flag1, data2, fIlag2; | In file included from ZE; \ | ^ ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hIn file included from :173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | : warning: unused variable 'flag2' [-Wunused-variable] 145 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp : uint32_2t data1,: flag1, In file included from data2, /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.hflag2; : | ^~~~~ 11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:: 2/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h: :145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h :174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h uint32_t data1,:75:7 : warning: unused variable 'w' [-Wunused-variable] f75 | l baarrier_bby_grouap(); | ^~~~~~~~~~~~~~~~~~r /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hg:29:15r: 1note: expanded from macro 'barrier_by_group', data2, fielr_by_garog2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.hup(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2;: 15: note: expanded from macro 'barrier_by_group' 29 | | c ^~~~~onst int /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.hw = thread:Idx.x145/WAR:P_SIZ28E; \: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t d | ^ aIn file included from ta1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2;: | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32_2, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32_2, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32_2, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32_4, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_u32_2, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMP | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NLCE_Sum_u32_2, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:CL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | 60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_u32_2, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | endbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32_2, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32_2, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32_2, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32_4, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Op, Algo, Proto, COLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32_4, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32_2, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32_4, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32_2, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32_4, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32_4, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32_4, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32_2, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBat/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), CL_PROT| O_SIMPLE] ^~~~~~~~~~~~~~~~~/NCCL_STE PS/sizeof/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h(T) : ste:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | pSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34 :7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, worIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthrk->recvbuff, work->r tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group),e ads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32_2, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(n | ^~~~~~~~~~~ edOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32_4, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32_4, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32_4, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32_4, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 11 warnings generated when compiling for gfx942. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1200. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. [ 93%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u64.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1101. [ 94%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = tIn file included from hreadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64_2, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_u64_2, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64_2, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64_2, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64_4, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64_4, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64_2, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64_4, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64_2, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64_4, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64_2, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64_2, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64_2, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64_2, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_u64_2, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64_2, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64_4, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64_4, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64_4, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64_4, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64_4, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64_2, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64_4, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64_4, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8_2, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8_2, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8_2, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8_2, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8_4, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8_2, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8_2, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8_4, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8_2, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8_4, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8_4, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8_2, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8_4, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(gr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8_4, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from oup), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_u8_2, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8_2, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < s/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8_2, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ubtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8_4, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8_4, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(ti/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_u8_2, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ d), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8_2, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ri:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8_4, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ng->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8_4, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8_4, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx906. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. [ 94%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1030. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. In file included from [ 94%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp.o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32_2, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32_4, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32_2, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32_2, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32_2, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_SumPostDiv_i32_2, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32_2, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32_2, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32_2, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), groIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group up(group), /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h| : ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~34 : 7| : tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 671 | 34 | s t e p Spirziem(ss(tteipdS,i znet_h r=e=a d0s ,? &nrcicnlgS-h>mperme.vc,o m&mr.ibnugf-f>Sniezxets,[ NwCoCrLk_-P>RsOeTnOd_bSuIfMfP,L Ew]o/rNkC-C>Lr_eScTvEbPuSf/fs,i zweoorfk(T-)> r:e dsOtpeApSrigz,e _0), {w o r| k ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~- > c| o group(groupn nIndex, work->connInde/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.hx:)34;: 7 :| ^note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h: 6534: | 5 : note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here prims (65t | i d , nrtuhnrReiandgs<,T ,& rRiendgO-p>,p rPervo,t o&,r iCnOgL-L>_nUeNxRtO,L Lw>o(rtki-d>,s enndtbhurfefa,d sw,o rwko-r>kr)e;c v b| u ^f f, work->red/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hO:p432A:r78g:, 0note: ,in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here work->connI n432de | x , w o r k-i>fc on(ntIindd e, ProtoSimple<2, 2, 4>, 4>' requested heren , T, R e65d | O p , ArlugnoR,i nPgr (C)O.LrLu_nU(NtRiOdL,L >s(utbitdn,, nwtohrrke)a;d s ,| ^w ork); | ^/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp :7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here7 | DEFINE_ncclDevFunc(ReduceScatter_ R432I | N G _ S I MiPfL E(_tSiud m

_(t),. rNuCnC(Lt_iAdL,G Os_uRbItNnG,, wNoCrCkL)_;P R O| T ^O _SIMPLE, 2) /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp :| 12^: 1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 12 | DEF I611N | E _ n c cRluDneWvoFruknBca(tRcehdP,L Ea_lSguom,P opsrtoDtiov,_ iu3n2r_o4l,l >n(c)c.lrFuunn(c)R;e d\u c e| S ^c atter, F/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hu:n670c:S15u:m Pnote: ofield 'nthreads' will be initialized after field 'tidInBlock's tDiv, 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_SumPostDiv_i32_2, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32_2, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32_4, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32_2, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32_4, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32_4, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32_2, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32_4, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32_4, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32_4, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32_4, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32_4, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32_4, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_tIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | b data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ arrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = thIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ readIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64_2, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_SumPostDiv_i64_2, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64_2, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64_4, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_SumPostDiv_i64_2, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64_2, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSizeIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), g(stepSize_ ==roup(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64_2, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64_2, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64_2, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64_4, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64_2, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64_4, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64_4, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.b:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROuffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, wTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->reork->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRingconnICndex, Owork->LconnInLdex)_; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64_4, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthUNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64_2, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ reads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64_4, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64_2, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>()In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64_2, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ .run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64_2, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64_4, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64_4, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64_4, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64_4, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64_4, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1200. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. [ 94%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx908. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. [ 95%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group()In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1,; fl a| g ^~~~~~~~~~~~~~~~~~1 , data2, flag2; /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h| : ^~~~~ 29:15/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:: 145note: :28expanded from macro 'barrier_by_group': warning: unused variable 'data2' [-Wunused-variable] 14529 | | ucionst int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ nt32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_tIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8_2, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_SumPostDiv_i8_2, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8_2, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8_4, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSi/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11ze_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8_2, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8_2, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_SumPostDiv_i8_2, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8_2, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from :/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173 : /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8_2, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8_2, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8_2, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8_2, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8_2, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8_2, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8_4, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8_4, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8_4, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8_4, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8_4, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8_4, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8_4, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8_4, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8_4, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8_4, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cppIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ :2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ :11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2;In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_SumPostDiv_u32_2, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32_2, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_SumPostDiv_u32_2, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32_2, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32_2, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32_2, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32_4, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32_2, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32_2, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32_4, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32_2, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32_4, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ LL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32_4, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32_2, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670In file included from :60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32_2, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32_4, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32_2, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32_4, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32_2, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32_4, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32_4, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32_4, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32_4, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32_4, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1030. 11 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1201. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. 11 warnings generated when compiling for gfx942. [ 95%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp [ 95%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_grouIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ p(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1,In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64_2, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64_4, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8_2, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8_2, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64_2, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64_2, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64_2, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8_2, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->seIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_SumPostDiv_u64_2, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ ndbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, wIn file included from ork); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64_2, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, wo/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &rinrk); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here g->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8_4, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ n) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64_2, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64_2, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(thr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.headIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64_2, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tid tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev,InBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ &ring->next, work->sendbuff, woIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | rk->recvb if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64_2, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTuff, work->redOpArg, 0, work->connIndex, work->connIndex); | O_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8_4, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_SumPostDiv_u64_2, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64_4, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64_2, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64_4, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64_2, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64_4, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthread/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670s(nthrea:ds), wid15(tid%WA:RP_SIZE), warp(tidwarning: /WARPinitializer order does not match the declaration order [-Wreorder-ctor]_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | w arpInBlock(threadId670x.x/W | ARP_SIZE ) , | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%tid4(tid),) nthre=ads(nth=reads)3, ti), gdInBlroup(grIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_SumPostDiv_u8_2, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ oup)ock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? nc, | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~c | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 l499 | SstepSihze(nccmlShmem.ecomm.bufmfSizes[.NCCL_PRcOTO_LL128o]/NCCL_SmTEPSm.buffSizes[NCCL_PROTO_SIMPLE]/NCC/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, L_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring&ring-->/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hn:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads),e>xt, woprk-r>sendebuff, vwork-,>recv b&uffring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, , work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRingc8onnI,ndex , worCk->coOnnInLdex);L | _ ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65U:5: note: Nin instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8_4, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 65R | OrunRinLgp(ti, Pd, nthreads,ro to, CwOLL_UoNROrk); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:LL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) 78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkCollOp(, )Al.gruo,n (Ptrotio, COdLL,_U NROsLuLbtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceS>(c).run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_aSttIMerP_RILNGE_L_L1S28u_SmumPPoostsDtivD_ui8_v2, n_cucl6FuncReduceSca4_t4,t necr, FuncSumPostDiv, uint8_t, NCCL_cAlFLunGcROed_ucReSIcaNttGer,, F unNcCSuCmPoLst_DiPv,R uOinTt6O4__tL, LNC1CL2_A8LGO,_R IN2G,) N CCL _| P^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatROTcOh_Sl, lalg,o, ty, redop, algo, proto, unroll>().run(); \ | ^ proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | sIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8_2, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_R/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64_4, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8_2, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8_2, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64_4, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64_4, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8_2, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ p, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthrea/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ds), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64_4, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8_2, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreaIn file included from ds, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64_4, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8_2, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64_4, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8_2, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSiIn file included from ze_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8_4, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | st/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8_2, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | t:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8_4, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ id(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8_4, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8_4, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8_4, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8_4, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8_4, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8_4, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1101. 11 warnings generated when compiling for gfx942. 11 warnings generated when compiling for gfx90a. [ 95%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_bf16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1100. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. [ 96%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_bf8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' :15: note: expanded from macro 'barrier_by_group' 29 | cons29t int w | = thread Idx.x/ const int w = threadIdx.x/WARP_SIZE; \ | ^ WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 75 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_In file included from group/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: (In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:)7: warning: unused variable 'w' [-Wunused-variable] 75; | ba r | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15:rier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2In file included from : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, In file included from data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp145:35: warning: unused variable 'flag2' [-Wunused-variable] : 145 | 2 uin: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:t32_t d80ata1, f:lag1, dat5a2, f:lag2; | ^~~~~ warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_groIn file included from up(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, f note: expanded from macro 'barrier_by_group' 29 | const lag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16_2, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_bf16_2, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16_2, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16_4, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16_2, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16_2, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16_4, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_bf16_2, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~10 warnings generated when compiling for host. | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16_4, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreadIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: s, &ring->prev, &rin/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSig->next, work->sendbuff, work->recvbuff, zwes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here ork->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | , nthrDEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16_2, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ eads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16_2, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.htid, sub:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tidtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16_2, ncclFuncReduce, FuncSum, hip_bfloat16,), nNCCL_ALGO_RING, NCCL_PROTO_SIMPLEthr,eads (nth2read)s), tidI nBlo| ck^(thr eadI/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hdx.x), :grou611p(:gro62up),: | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_note: 671expanded from macro 'DEFINE_ncclDevFunc' | ste pSize(611step | Siz e_ = = 0 ? nc clShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepRunWorkBatch, algo, proto, unroll>().Sizre_) u{ n(); \ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h ^:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h | pr:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBilms(toid, cnthrekads,( &ritngh->prrev, e&raingd->neIxt, wdork-x>sen.dbufxf, w)ork, group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16_4, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16_2, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16_2, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | D/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16_2, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, a lgo, prnoto, unrcoll>().crun(); l\ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hS:670:h15: note: field 'nthreads' will be initialized after field 'tidInBlock' m670 | teid(tid)m, nthrea.ds(nthrceads), toidInBlomck(thrmeadIdx.x.), grboup(grouup), f | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:fSizes[NCCL_PROTO_SIMPLE]/NCCL_ST670:60: note: Efield 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(ntPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, worhkread-s), >tidInrBloeck(thcreadIdvx.x),b grouup(grfoup),f | ^~~~~~~~~~~ , work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidI 432 | ifnBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem. (tidcomm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | ru < subtn) RunWorkColl(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16_2, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RINNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFuncG(, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Reduce_RING_SIMPLE_Sum_bf16_4, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16_4, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16_4, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), protgroup(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16_4, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCLo, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(gr_oPROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ up), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16_4, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16_4, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16_4, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1,In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145In file included from :21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, da/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from ta2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h145:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h::80:5: warning: 35unused variable 'w' [-Wunused-variable] 80: warning: unused variable 'flag2' [-Wunused-variable] 145 | | barrie r_by_g roup() ; | ^~~~~~~~~~~~~~~~~~ u/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15:i note: expanded from macro 'barrier_by_group' nt32_t data1, 29 | consft int lw = thareadIdgx.x/WA1RP_S,IZE; da\ | t ^ a2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = tIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ hreadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21:1 , data2, flag2; | ^~~~~ warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf8_2, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_bf8_2, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads)670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | , tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf8_2, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf8_4, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf8_2, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf8_2, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf8_2, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &In file included from ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf8_2, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeoIn file included from f/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run((uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, wtid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here ork-> 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf8_2, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadI work->recvbufdx.x), group(group), | ^~~~~~~~~~~ f, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_bf8_2, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf8_2, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RIn file included from unWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthread/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:s2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:(11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:n173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670t:15: hwarning: initializer order does not match the declaration order [-Wreorder-ctor] r670 | e tiad(tid)d, nthsreads)(nthreads),, ti dIntBlocidInBlock(threadIdx.x), group(grk(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PRoup), | ^~~~~~~~~~~ OTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf8_2, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redO/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDepvArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf8_2, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Func(Reduce_RING_SIMPLE_Sum_bf8_4, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), ti/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf8_4, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4dInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nth)r | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ eads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf8_2, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf8_4, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads)/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf8_4, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE,, tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf8_4, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf8_4, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid),:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : ste/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connInpSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^dex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if ( /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.ht:63:5:i note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here d63 | runR(tid), nthr eadRunWorkCollk); | ( ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h):432:78: note: .in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tirun(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf8_4, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, d,N subCtn, wCorkL); _| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cppP:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested hereR 12O | DEFITNE_nOcclDe_vFunSc(ReIduceM_RINPG_SILMPLEE_Sum_bf8_,4, n cclFu4ncRe)duce , Fu ncSu| m^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: , rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group),note: field 'group' will be initialized after field 'stepSize' 670 | | ^~~~~~~~~~~~~~~~~ t id(/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.htid), :nt670hre:ads60(nt:hr enote: field 'group' will be initialized after field 'stepSize' 670ads), tidInBlock(threadIdx.x), group(group), | | ^~~~~~~~~~~ti d(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf8_4, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf8_4, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1030. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. [ 96%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f16.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, In file included from head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h::75:7: warning: 173unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ : /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ , flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ IZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16_2, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16_4, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16_2, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16_2, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16_2, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_f16_2, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_f16_2, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16_2, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16_2, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16_2, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16_2, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16_2, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16_4, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16_2, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16_4, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16_2, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16_4, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16_4, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16_4, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16_4, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | step/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16_4, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16_4, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16_4, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16_4, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1102. [ 96%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f32.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx1030. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1100. 10In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 10 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 10 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp :data21: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ , flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11In file included from : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp5:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ : | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32_2, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32_2, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32_2, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32_2, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32_2, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2)In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthread | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ s(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32_2, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 96%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f64.cpp.o In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_f32_2, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f64.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32_2, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32_2, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h : 670i:f15 :( tiwarning: d initializer order does not match the declaration order [-Wreorder-ctor]< subtn) RunWorkCo l670l | t(i)d.IrnuBnl(otcikd(,t hsruebatdnI,d xw.oxr)k,) ;g r o| u ^p (group)/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp,: 7 :| 1 ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~: note: | in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 7671 | | D E F I NsEt_enpcScilzDee(vsFtuenpcS(iRzeed_u c=e=_ R0I N?G _nScIcMlPSLhEm_eSmu.mc_ofm3m2._b2u,f fnSciczleFsu[nNcCRCeLd_uPcReO,T OF_uSnIcMSPuLmE,] /fNlCoCaLt_,S TNECPCSL/_sAiLzGeOo_fR(ITN)G ,: NsCtCeLp_SiPROzTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ e_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32_4, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32_4, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32_4, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32_4, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32_4, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32_4, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32_4, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32_4, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32_2, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_f32_2, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32_4, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32_2, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h10 warnings generated when compiling for host. :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32_4, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32_4, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64_2, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64_2, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbu f ft,i dw(otrikd-)>,r endtOhprAeragd,s (0n,t hwroerakd-s>)c,o ntniIdnIdneBxl,o cwko(rtkh-r>ecaodnIndIxn.dxe)x,) ;g r o| u ^p (group), | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~: 63 :5| : tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | r671un | R i n g c(ltSihdm,e mn.tchormema.dbsu,f fwSoirzke)s;[ N | C ^C L_PROTO_S/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hI:M432P:L78E:] /note: Nin instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested hereC CL_STEPS /432s | i z e o f ( Ti)f :( tsitde p, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested hereL L>().run(tid ,33 | s u btn, w o r kp)r;i m s| ( ^t id, nt/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpph:r7e:a1d:s ,note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here& ring->pre v7, | D&ErFiInNgE-_>nncecxltD,e vwFournkc(-R>esdeuncdeb_uRfIfN,G _wSoIrMkP-L>Er_eScuvmb_uff6f4,_ 2w,o rnkc-cl>FruendcORpeAdrugc,e ,0 ,F uwnocrSku-m>,c odnonuIbnled,e xN,C CwLo_rAkL-G>Oc_oRnInNIGn,d eNxC)C;L _ P| R ^O TO_SIM/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.hP:L63E:,5 2:) note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h63: | 611 : 62 : rnote: uexpanded from macro 'DEFINE_ncclDevFunc'n Ring,( trieddo,p r,e aadlsg,o ,w oprrko)t;o , | u ^n roll>().run/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h():;432 :\78 : | note: ^in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h :432670 | :15 : note: field 'nthreads' will be initialized after field 'tidInBlock' if (ti d670 | < s u bttind)( tRiudn)W,o rnktChorlelag(r)o.urpu(ng(rtoiudp,) ,s u b| t ^~~~~~~~~~~~~~~~~n , w/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.ho:r670k:)60;: note: | field 'group' will be initialized after field 'stepSize' ^ 670 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp : 12 :t1i:d (note: tin instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested herei d), nthre a12d | sD(EnFtIhNrEe_andcsc)l,D etviFduInncB(lRoecdku(cteh_rReIaNdGI_dSxI.MxP)L,E _gSruomu_pf(6g4r_o4u,p )n,c c l| F ^~~~~~~~~~~u ncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64_2, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64_2, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64_2, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_f64_2, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64_2, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64_4, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64_4, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64_4, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64_4, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64_2, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_f64_2, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64_4, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tidIn file included from ), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64_2, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested hereIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64_2, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64_2, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64_4, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64_4, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64_4, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64_4, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64_4, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1101. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. [ 97%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_tIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from :11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 11 warnings generated when compiling for gfx942. [ 97%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u32.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8_2, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_f8_2, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8_2, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8_2, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8_2, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8_4, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8_2, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ >().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8_4, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8_4, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8_2, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8_2, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8_4, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(gro62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8_2, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ up), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8_2, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8_4, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8_4, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8_4, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8_4, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8_2, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_f8_2, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8_2, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8_4, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8_4, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8_4, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ , flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32_2, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32_2, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32_2, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32_4, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32_2, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32_2, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32_2, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32_4, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_u32_2, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32_4, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_u32_2, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32_2, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32_2, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32_2, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32_2, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(step/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), Size_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32_4, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32_4, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32_4, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32_2, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32_4, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32_4, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32_4, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32_4, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32_4, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 11 warnings generated when compiling for gfx942. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1201. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. [ 97%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u64.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1201. [ 97%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64_2, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64_2, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64_2, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/s iz670e | o f ( T )t i:d (sttiedp)S,i znet_h)r e{a d s| ( ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~n t h| r group(groupe ads), tidInBlock(threadIdx/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h.:x)33,: 7g:r onote: uin instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested herep (group), | ^~~~~~~~~~~~~~~~~33 | pr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hi:m670s:(60t:i dnote: ,field 'group' will be initialized after field 'stepSize' nthreads ,670 | & r i n g->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64_2, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBattcihd<(ctoildl),, tnyt,h rreeaddosp(r,e aadlsg)o,, tpirdoItnoB,l oucnkr(otlhlr>e(a)d.Irduxn.(x));, \g r o| u ^p (group)/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h,: 670 :| 15 ^~~~~~~~~~~: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64_4, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64_2, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64_4, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64_4, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64_2, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64_4, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64_4, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64_2, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64_2, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64_4, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64_2, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_u64_2, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64_4, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_u64_2, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64_2, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64_4, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64_2, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64_4, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64_4, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64_4, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t dataIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8_2, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8_2, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8_4, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8_2, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8_2, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_u8_2, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ ) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8_4, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10In file included from warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_u8_2, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8_2, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8_2, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8_4, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8_2, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8_4, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8_2, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8_4, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8_4, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_GO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8_2, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8_4, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8_2, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8_4, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8_2, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8_4, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8_4, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8_4, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1201. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. [ 98%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i32.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1100. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. [ 98%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i64.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; In file included from | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint3In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WAIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: 2_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ RP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | constIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_SumPostDiv_i32_2, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32_2, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32_2, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32_2, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32_4, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_SumPostDiv_i32_2, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32_2, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32_2, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32_4, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32_2, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32_2, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32_2, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkCollIn file included from ()/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp.:r2u: nIn file included from (/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.ht:i11d: ,In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hs:u173b: tn/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h,: 670w:o15r:k )warning: ; initializer order does not match the declaration order [-Wreorder-ctor] | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here670 | tid( t7i | dD)E,F InNtEh_rnecacdlsD(envtFhurneca(dRse)d,u ctei_dRIInNBGl_oScIkM(PtLhEr_eSaudmIPdoxs.txD)i,v _gir3o2u_p2(,g rnocucpl)F,u n c| R ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~e d u| c tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_e , FuncSum P671o | s t D i vs,t eipnSti3z2e_(ts,t eNpCSCiLz_eA_L G=O=_ R0I ?N Gn,c cNlCSChLm_ePmR.OcToOm_mS.IbMuPfLfES,i z2e)s [ N| C^C L_PROT/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hO:_611S:I62M:P Lnote: Eexpanded from macro 'DEFINE_ncclDevFunc'] /NCCL_ S611T | E P S / sRiuzneWoofr(kTB)a t:c hs , algo, proto, unroll>().run(); \ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h :| 33 ^: 7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h :33670 | : 15 : note: field 'nthreads' will be initialized after field 'tidInBlock' prims(t i670d | , n t htrieda(dtsi,d )&,r inntgh-r>epardesv(,n t&hrrienagd-s>)n,e xtti,d IwnoBrlko-c>ks(etnhdrbeuafdfI,d xw.oxr)k,- >grreocuvpb(ugfrfo,u pw)o,r k -| > ^~~~~~~~~~~~~~~~~r edO/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hp:A670r:g60,: 0note: ,field 'group' will be initialized after field 'stepSize' work->c o670n | n I n d etxi,d (wtoirdk)-,> cnotnhnrIenaddesx()n;t h r| e ^a ds), t/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.hi:d63I:n5B:l onote: cin instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested herek (threa d63I | d x . x )r,u ngRrionugp<(Tg,r oRuepd)O,p , | P ^~~~~~~~~~~r oto, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32_2, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32_4, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32_2, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32_4, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32_4, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32_4, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); :78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32_4, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32_4, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32_4, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32_4, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32_4, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64_2, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_SumPostDiv_i64_2, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64_2, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64_2, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64_2, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64_4, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64_2, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64_2, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64_2, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64_4, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64_4, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(thr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tieadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ dInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64_4, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64_4, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64_2, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64_4, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx. | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64_4, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64_2, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_SumPostDiv_i64_2, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64_2, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl nthrea(ds)(.nrtuhnrea(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64_2, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ds), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64_4, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64_4, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64_4, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64_4, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1201. 11 warnings generated when compiling for gfx942. 11 warnings generated when compiling for gfx90a. [ 98%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1201. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. [ 98%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u32.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from 174/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ : /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8_2, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_SumPostDiv_i8_2, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8_2, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8_2, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8_2, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8_2, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8_2, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8_4, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8_4, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreadIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: s(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | 670t | i d ( t itdi)d,( tnitdh)r,e andtsh(rnetahdrse(andtsh)r,e atiddsI)n,B ltoicdkI(ntBhlroecakd(Itdhx.rxe)a,d Igdrxo.uxp)(,g rgoruopu)p,( g r| o ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~u p )| , tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ | ^~~~~~~~~~~ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8_2, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8_4, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_SumPostDiv_i8_2, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8_4, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8_2, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8_2, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8_4, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8_4, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8_4, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8_4, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8_2, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8_2, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8_4, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8_4, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8_4, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ rier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32_2, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_SumPostDiv_u32_2, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32_4, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32_2, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(groIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32_2, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ up), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32_2, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32_2, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_SumPostDiv_u32_2, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32_2, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32_4, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32_4, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32_4, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32_2, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32_4, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), ntIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32_2, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreahreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ds(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32_2, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32_2, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32_2, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32_4, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32_4, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32_4, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32_4, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32_4, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32_4, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx906. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. 11 warnings generated when compiling for gfx942. [ 99%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u64.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp [ 99%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:1In file included from : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | conIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ st int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ rier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | In file included from uint32/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrie_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | r_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: :In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174 : /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14:warning: warning: unused variable 'data1' [-Wunused-variable] unused variable 'w' [-Wunused-variable]145 | u int3 2_t data1, fla80g1, dat | a2, fla g2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145 :21: warning: unused variable 'flag1' [-Wunused-variable] 145 | b uinta32_t darta1, flrag1, daita2, er_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from const int w = threadIdx.x/WARP_SIZE; \ | ^ _t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ , flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flagIn file included from 1, da/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hta2, :flag2175; : /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5:| ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, fl warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2\: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ | ^ ag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1,In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ bIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ arrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const iIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ nt w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64_2, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_SumPostDiv_u64_2, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64_2, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64_2, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u8_2, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tidIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PR%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_SumPostDiv_u64_2, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_ROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_SumPostDiv_u8_2, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ ING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u8_2, ncclFuncReduce, FuncSumPostroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64_4, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64_2, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u8_2, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u8_2, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64_2, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hn:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64_4, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto,cclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(groupIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &rin unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ g->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | r| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64_2, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ unRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u8_2, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:7:1: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cppnote: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here :7 | DE2FINE_ncclDevFun: c(RedIn file included from uce_RI/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.hNG_SIM:PLE_SumPostDiv_u8_2, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64_2, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPos/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64_4, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tDiv_u8_2, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROT/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recMPLvE]/NCCbL_STEPSu/sizeoff(T) : stfepSize_,) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group w/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.hor:33k->redOpArg, 0,:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here w33 | prims(tid, nthIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &rreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, ork->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (ti0,d wor k->conconnbIndex)t; | n ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h):63: 5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested hereR 63 | u nWor rkunRCoingprev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u8_2, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ edOp, Proto, COLL_UNROLL>(tid, nthreads, work); /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RI| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:ll78().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64_4, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u8_4, ncclFuncReduNG_SIMPLE_SumPostDiv_u8_4, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u8_4, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(step/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl()Size_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ stepSize_) { .run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u8_4, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->con/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64_4, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64_2, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ runRing, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEOp, Algo, Proto, COLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64_2, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ FINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64_2, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/stidInBlock(threadIdx.x), group(group)izeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64_4, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buf, | ^~~~~~~~~~~ fSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u8_4, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u8_4, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unr note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads)In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u8_2, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64_4, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from oll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64_2, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_nIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(tcclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u8_4, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ hreadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u8_2, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u8_4, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_SumPostDiv_u8_2, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64_4, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u8_2, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hn:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads,UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64_4, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ &ring->prev, &ring->next10 warnings generated when compiling for host. , work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u8_4, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ runRing(tid, nthreads, wor 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64_4, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ k); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64_4, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u8_4, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, work->sendbuff, work->recvbuff, work->redOpArg, 0, work->connIndex, work->connIndex); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u8_4, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for host. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx908. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. [ 99%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/sendrecv_sum_i8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/sendrecv_sum_i8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/sendrecv_sum_i8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/sendrecv_sum_i8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx1030. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx906. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx1100. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx942. [ 99%] Building CXX object CMakeFiles/rccl.dir/git_version.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/git_version.cpp.o -MF CMakeFiles/rccl.dir/git_version.cpp.o.d -o CMakeFiles/rccl.dir/git_version.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/git_version.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WIn file included from ARP_In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1,In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] flag1, data2, fl145ag2; | ^~~~~ | uiIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ nt32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, dataIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ 2,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:45:7: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 2>, 1>::Primitives' requested here 45 | prims(tid, tn, nullptr, &work->sendRank, work->sendAddr, nullptr, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:261:9: note: in instantiation of function template specialization 'RunWorkBatch, 1, 2, 2>::runSend>' requested here 261 | runSend>(subtid, subtn, group, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8_2, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:103:7: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 2>, 1>::Primitives' requested here 103 | prims(tid, tn, &work->recvRank, nullptr, nullptr, work->recvAddr, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:273:9: note: in instantiation of function template specialization 'RunWorkBatch, 1, 2, 2>::runRecv>' requested here 273 | runRecv>(subtid, subtn, group, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8_2, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, : warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:45:7: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 2>, 1>::Primitives' requested here 45 | prims(tid, tn, nullptr, &work->sendRank, work->sendAddr, nullptr, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:261:9: note: in instantiation of function template specialization 'RunWorkBatch, 1, 2, 2>::runSend>' requested here 261 | runSend>(subtid, subtn, group, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8_2, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:45:7: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 2>, 1>::Primitives' requested here 45 | prims(tid, tn, nullptr, &work->sendRank, work->sendAddr, nullptr, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:261:9: note: in instantiation of function template specialization 'RunWorkBatch, 1, 2, 2>::runSend>' requested here 261 | runSend>(subtid, subtn, group, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8_2, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_In file included from SIMPL/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: E]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:45:7: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 2>, 1>::Primitives' requested here 45 | prims(tid, tn, In file included from n/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11u: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hl:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor]l p670 | t r ti,d &work->sendRank, work->sendAddr, nullptr, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:261:9: note: in instantiation of function template specialization 'RunWorkBatch, 1, 2, 2>::runSend>' requested here (tid261), nthr | ead s(n threads) , t idI nBl ock (th reardIdxu.x)nS, group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/end>(subtid, subtn, group, work); | NC ^C L_S/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cppTEPS/si:zeo3f(T:) :1 st: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here epSize_3) | D {E FINE_nccl| D ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ e | v group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.hF:u45:7n:c(SendRecv_RING_SIMPLE_Sum_i8_2, ncclFuncSe note: nin instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here d 45 | R e c prvims,(ti d, Ftn,u nunllpctr,S &wuorkm->s,end Ranki, wnorkt->s8e_t, NCCL_ALGO_RndAddr, nullptr, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:259:9: note: in instantiation of function template specialization 'RunWorkBatch, 1, 2, 2>::runSend>' requested here 259 | I NG, NC CL_ PR OTOr_SIMuPLEn, 2S) e| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hnd, algo, proto, unrmploe<1l,1,l4>>>(su(bti)d, .subrtn,u grnoup(, w)ork;); | ^ \/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp :3:1 : note: | in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here ^3 | DE/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hFINE_nc:clD670evF:unc15(Se: note: nfield 'nthreads' will be initialized after field 'tidInBlock'dRe 670 | tid(tidcv_)RIN,G_S IMPnLEt_Suhm_i8r_2,e nads(nthreads), tidInBlocclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2)ck(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' | ^670 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h : 611: 62t:i dnote: (expanded from macro 'DEFINE_ncclDevFunc't i d611) | , n t hRreuandWsor(knBthartecadhs<)c,o ltli, dtIyn,B lroecdko(tphd,I daxl.gxo),, pgrrootuop,( gurnoruopl)l,> ( )| . ^~~~~~~~~~~r un(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:45:7: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 2>, 1>::Primitives' requested here 45 | prims(tid, tn, nullptr, &work->sendRank, work->sendAddr, nullptr, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:261:9: note: in instantiation of function template specialization 'RunWorkBatch, 1, 2, 2>::runSend>' requested here 261 | runSend>(subtid, subtn, group, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8_2, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:45:7: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 45 | prims(tid, tn,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:45:7: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 2>, 1>::Primitives' requested here 45 | prims(tid, tn, nullptr, &work->sendRank, work->sendAddr, nullptr, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:261:9: note: in instantiation of function template specialization 'RunWorkBatch, 1, 2, 2>::runSend>' requested here 261 | runSend>(subtid, subtn, group, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8_2, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] nullptr, &work->sendRank, work->sendAddr, nullptr, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:261:9: note: in instantiation of function template specialization 'RunWorkBatch, 1, 2, 4>::runSend>' requested here 261 | runSend>(subtid, subtn, group, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:4:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 4 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8_4, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(g/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hrou/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hp):611:,62: note: expanded from macro 'DEFINE_ncclDevFunc' | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0611 | ?Ru nWonrckBactchl, aclogo,m prmoto,. unbrolul>(f).rfun:670(:15:)S warning: ;iinitializer order does not match the declaration order [-Wreorder-ctor] z\e670 | s [| N ^tiC d(C/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hLtid_), Pn:tRh670rOe:aT15ds(O:nt_ hrnote: Sefield 'nthreads' will be initialized after field 'tidInBlock'aId sM) P, tLi670dEI | n]B l/o Nck (th reatdIdix.xd), gro(up(tgroiup)d, )| ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~C, C L_| nST tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_tEP hS/ rsiez671eof | (a T)d :s (nthreads), tidInBlock(threadI sdtepxSiz.e(sxte)pSi,ze_ ==g 0 r? nocculShpmem(.cogmm.rbstuepSfizfe_)S { i | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ z | group(groupe /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:103:7: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 2>, 1>::Primitives' requested here 103 | prims(tid, tn, &woroupk), | ^~~~~~~~~~~~~~~~~ -/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:>670:60r: note: efield 'group' will be initialized after field 'stepSize' c670 | v sR [NCa CLnt_PRkiO,dIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:45:7: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 8>, 1>::Primitives' requested here 45 | prims(tid, tn, nullptr, &work->sendRank, work->sendAddr, nullptr, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:257:9: note: in instantiation of function template specialization 'RunWorkBatch, 1, 2, 2>::runSend>' requested here 257 | runSend>(subtid, subtn, group, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8_2, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nullpt(trid,), nthnreuallptr, work->recvAddr, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:273d:s(9nt:hr eanote: dsin instantiation of function template specialization 'RunWorkBatch, 1, 2, 2>::runRecv>' requested here), t idI273nBTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:103:7: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 103 | prims(tid, tn, &work->recvRank, nullptr, nullptr, work->recvAddr, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:271:9: note: in instantiation of function template specialization 'RunWorkBatch, 1, 2, 2>::runRecv>' requested here 271 | runRecv>(subtid, subtn, group, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8_2, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | lo ck (t hr ead I dx. x), grrouup(ngrRouep)c, v | < ^~~~~~~~~~~ ProtoSimple<1,1,COLL_UNROLL>>(subtid, subtn, group, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8_2, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:103:7: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 2>, 1>::Primitives' requested here 103 | prims(tid, tn, &work->recvRank, nullptr, nullptr, work->recvAddr, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:273:9: note: in instantiation of function template specialization 'RunWorkBatch, 1, 2, 2>::runRecv>' requested here 273 | runRecv>(subtid, subtn, group, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8_2, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:103:7: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 2>, 1>::Primitives' requested here 103 | prims(tid, tn, &work->recvRank, nullptr, nullptr, work->recvAddr, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:273:9: note: in instantiation of function template specialization 'RunWorkBatch, 1, 2, 2>::runRecv>' requested here 273 | runRecv>(subtid, subtn, group, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8_2, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor]| group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h :103:7: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 670103 | | pri ms(t id, tn, &tworki->recvRadnk, (nulltptr,i nuldlpt)r, wo,rk- nthreads(nthreads), tidInBlo>reccvAddkr, ( | ^ t/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:273:h9In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:45:7: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 45 | prims(tid, tn, nullptr, &work->sendRank, work->sendAddr, nullptr, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:259:9: note: in instantiation of function template specialization 'RunWorkBatch, 1, 2, 2>::runSend>' requested here 259 | runSend>(subtid, subtn, group, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8_2, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ : note: rin instantiation of function template specialization 'RunWorkBatch, 1, 2, 4>::runRecv>' requested here e273 | a d ruIndx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ Re| cv

>(subtid, supSbitzen(s,te pSgizre_o =u= p0 , ? ncclShmem.comm.buffSizes[NCCL_PROTO_SwoIrkM);P L| ^E /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp]:/4:N1:C note: Cin instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here L_ S4 | TDEEFIPNES_n/ccslDievzFuenco(Sfend(ReTc)v _R:IN G_sSItMPeLEp_SSumi_iz8_e4,_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:45:7: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 2>, 1>::Primitives' requested here 45 | prim snc(cltFuincdSe,nd Retcvn, ,Fu ncnSuum,l intl8_pt,t NrCC,L_ AL&GOw_RoINrG,k N-CC>L_sPReOTnO_dSIRMaPnLEk, ,4) w| ^o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hr:611:62: note: kexpanded from macro 'DEFINE_ncclDevFunc'-> se ndAd611dr | , nu RunWorllptr, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:261:9: note: in instantiation of function template specialization 'RunWorkBatch, 1, 2, 2>::runSend>' requested here 261 | runSendol(l,s utyb, treidd,op u, btalngo,, prgortoo,u upnr,ol l>w()o.rrunk()); ;\ | ^ | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h ^:670 :15/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp: note: field 'nthreads' will be initialized after field 'tidInBlock' : 3670: | 1 : t idnote: (tin instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested hereid ) , nt3hr | eaDdsE(nFthINreEad_ncclDevFunc(SendRecv_RING_SIMPLsE),_ tiSduImn_Bilo8ck(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h_:2,670 n:cc60lF:un cSnote: enfield 'group' will be initialized after field 'stepSize'dR ec v, 670F/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.huncSum, int8_t, NCCL_ALGO_RING, N | C C Lti_d(PtidR)O, nTthOre_adSs(IntMhrPeaLdsE),, t id2In)Bl o c| k(^th re/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hadId:x.611x):, 62gr:ou p(note: g:expanded from macro 'DEFINE_ncclDevFunc'r670 o: 15up:611) | warning: ,initializer order does not match the declaration order [-Wreorder-ctor] R| u ^~~~~~~~~~~ n670 | tid(tid), nthreads(nthreadWso)rk,Ba tcth, algo, pr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:103:7: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 2>, 1>::Primitives' requested here 103 | prims(tid, tn, &work->recvRank, nullptr, nullptr, work->recvAddr, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:273:9: note: in instantiation of function template specialization 'RunWorkBatch, 1, 2, 2>::runRecv>' requested here 273 | runRecv>(subtid, subtn, group, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8_2, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ oto, unrodlIlnB>lo(ck()th.reraduIdnx.x(),) g;ro \ | ^up (g/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hroup:),670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? nc670c | l S htimd(etimd)., cntohrmeamds.(nbthurefadfs)S, itizdIensB[loNckC(tChrLea_dIPdx.RxO), TgrOo_up(SgrIoMPLE]/NCCL_STEPS/sizeof(T) : stepSize_up)), {| ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h| : ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~670: 60: note: | field 'group' will be initialized after field 'stepSize' group(group 670 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h ti:d(45ti:d)7, :nthrea dsnote: (nin instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested heret hr eads), tidInBlock(t45 | h r e aprdIdx.x), group(girmso(tuidp, )tn,, nu ll| pt ^~~~~~~~~~~r, &work->sendRank, work->sendAddr, nullptr, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:261:9: note: in instantiation of function template specialization 'RunWorkBatch, 1, 2, 4>::runSend>' requested here 261 | runSend>(subtid, subtn, group, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:4:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 4 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8_4, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:45:7: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 2>, 1>::Primitives' requested here 45 | prims(tid, tn, nullptr, &work->sendRank, work->sendAddr, nullptr, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:261:9: note: in instantiation of function template specialization 'RunWorkBatch, 1, 2, 2>::runSend>' requested here 261 | runSend>(subtid, subtn, group, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8_2, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:103:7: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 2>, 1>::Primitives' requested here 103 | prims(tid, tn, &work->recvRank, nullptr, nullptr, work->recvAddr, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:273:9: note: in instantiation of function template specialization 'RunWorkBatch, 1, 2, 2>::runRecv>' requested here 273 | runRecv>(subtid, subtn, group, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8_2, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid),/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h :n670t:h15r: ewarning: ainitializer order does not match the declaration order [-Wreorder-ctor]d s (n670 | t h r e atdisd)(,t itdi)d, nthreads(nthreInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSi/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:45:7: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 45 | prims(tid, tn, nullptr, &work->sendRank, work->sendAddr, nullptr, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:261:9: note: in instantiation of function template specialization 'RunWorkBatch, 1, 2, 4>::runSend>' requested here 261 | runSend>(subtid, subtn, group, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:4:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 4 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8_4, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RINze(steadps)S, tiidInzBloeck(_thr ead=Idx=.x) , g0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_Sroup(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671G | , NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeIoMPLfE]/(NCCTL_S)TEPS /s:ize of(sT) : stepStizee_) p{ S| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ i | z group(group e/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h_:103):7: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 103 | prims(tid, tn, &work->recvRank, nullptr, | group(group n/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.hu:103l:l7: note: pin instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 2>, 1>::Primitives' requested here t103 | r ,pri ms(twork->recvAddr, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:273:9: note: in instantiation of function template specialization 'RunWorkBatch, 1, 2, 4>::runRecv>' requested here 273 | ruid, tn, &work->recvRank, nullptr, nullptr, work->recvAddr, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:273:9: note: in instantiation of function template specialization 'RunWorkBatch, 1, 2, 2>::runRecv>' requested here 273 | runRecvO>(sLubtiL_UNROLL>>(subtid, subtnd, subtn, group, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:4:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 4 | DEFINE_ncclDevFunc(SendRecv_RING_SI,M gProuLp, worEk);_ | S ^ u/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cppm:_3:1i: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 3 | 8DEF_INE4_nc,clD evFnuncc(SecndRlecv_FRINuncSenG_dSIMRPLEecv, FuncSum, int8_t, NCCL_Sum_i8_2, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ _ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:103:7: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 8>, 1>::Primitives' requested here 103 | prims(tid, tn, &work->recvRank, nullptr, nullptr, work->recvAddr, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:269:9: note: in instantiation of function template specialization 'RunWorkBatch, 1, 2, 2>::runRecv>' requested here 269 | runRecv>(subtid, subtn, group, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8_2, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:45:7: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 45 | prims(tid, tn, nullptr, &work->sendRank, work->sendAddr, nullptr, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:261:9: note: in instantiation of function template specialization 'RunWorkBatch, 1, 2, 4>::runSend>' requested here 261 | runSend>(subtid, subtn, group, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:4:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 4 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8_4, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:103:7: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 103 | prims(tid, tn, &work->recvRank, nullptr, nullptr, work->recvAddr, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:271:9: note: in instantiation of function template specialization 'RunWorkBatch, 1, 2, 2>::runRecv>' requested here 271 | runRecv>(subtid, subtn, group, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8_2, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(grou/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:45:7: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 45 | prims(tid, tn, nullptr, &work->sendRank, work->sendAddr, nullptr, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:261:9: note: in instantiation of function template specialization 'RunWorkBatch, 1, 2, 4>::runSend>' requested here 261 | runSend>(subtid, subtn, group, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:4:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 4 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8_4, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ p), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:45:7: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 45 | prims(tid, tn, nullptr, &work->sendRank, work->sendAddr, nullptr, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:261:9: note: in instantiation of function template specialization 'RunWorkBatch, 1, 2, 4>::runSend>' requested here 261 | runSend>(subtid, subtn, group, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:4:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 4 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8_4, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:103:7: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 103 | prims(tid, tn, &work->recvRank, nullptr, nullptr, work->recvAddr, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:273:9: note: in instantiation of function template specialization 'RunWorkBatch, 1, 2, 4>::runRecv>' requested here 273 | runRecv>(subtid, subtn, group, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:4:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 4 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8_4, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] group670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:103:7: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 2>, 1>::Primitives' requested here 103 | prims(tid, tn, &work->recvRank, nullptr, nullptr, work->recvAddr, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:273:9: note: in instantiation of function template specialization 'RunWorkBatch, 1, 2, 2>::runRecv>' requested here 273 | runRecv>(subtid, subtn, group, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8_2, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:103:7: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 103 | prims(tid, tn, &work->recvRank, nullptr, nullptr, work->recvAddr, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:273:9: note: in instantiation of function template specialization 'RunWorkBatch, 1, 2, 4>::runRecv>' requested here 273 | runRecv>(subtid, subtn, group, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:4:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 4 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8_4, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:45:7: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 45 | prims(tid, tn, nullptr, &work->sendRank, work->sendAddr, nullptr, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:261:9: note: in instantiation of function template specialization 'RunWorkBatch, 1, 2, 4>::runSend>' requested here 261 | runSend>(subtid, subtn, group, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:4:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 4 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8_4, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:103:7: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 103 | prims(tid, tn, &work->recvRank, nullptr, nullptr, work->recvAddr, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:273:9: note: in instantiation of function template specialization 'RunWorkBatch, 1, 2, 4>::runRecv>' requested here 273 | runRecv>(subtid, subtn, group, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:4:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 4 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8_4, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nth/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:103:7: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 103 | prims(tid, tn, &work->recvRank, nullptr, nullptr, work->recvAddr, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:273:9: note: in instantiation of function template specialization 'RunWorkBatch, 1, 2, 4>::runRecv>' requested here 273 | runRecv>(subtid, subtn, group, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:4:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 4 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8_4, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, reads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:45:7: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 45 | prims(tid, tn, nullptr, &work->sendRank, work->sendAddr, nullptr, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:261:9: note: in instantiation of function template specialization 'RunWorkBatch, 1, 2, 4>::runSend>' requested here 261 | runSend>(subtid, subtn, group, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:4:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 4 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8_4, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 12 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:103:7: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 103 | prims(tid, tn, &work->recvRank, nullptr, nullptr, work->recvAddr, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:273:9: note: in instantiation of function template specialization 'RunWorkBatch, 1, 2, 4>::runRecv>' requested here 273 | runRecv>(subtid, subtn, group, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:4:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 4 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8_4, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:103:7: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 103 | prims(tid, tn, &work->recvRank, nullptr, nullptr, work->recvAddr, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/sendrecv.h:273:9: note: in instantiation of function template specialization 'RunWorkBatch, 1, 2, 4>::runRecv>' requested here 273 | runRecv>(subtid, subtn, group, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:4:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 4 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8_4, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx942. 12 warnings generated when compiling for gfx1030. 12 warnings generated when compiling for gfx1201. 12 warnings generated when compiling for gfx906. 12 warnings generated when compiling for gfx1102. 12 warnings generated when compiling for gfx1100. 12 warnings generated when compiling for gfx1101. 12 warnings generated when compiling for gfx1200. [100%] Linking CXX shared library librccl.so /usr/bin/cmake -E cmake_link_script CMakeFiles/rccl.dir/link.txt --verbose=1 /usr/bin/cmake -E time /usr/bin/hipcc -fPIC -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -parallel-jobs=1 -Xoffload-linker -mllvm=-amdgpu-kernarg-preload-count=16 -Xlinker --dependency-file=CMakeFiles/rccl.dir/link.d -Wl,-z,relro -Wl,--as-needed -Wl,-z,pack-relative-relocs -Wl,-z,now -Wl,-z,now -Wl,--build-id=sha1 -specs=/usr/lib/rpm/redhat/redhat-package-notes -shared -Wl,-soname,librccl.so.1 -o librccl.so.1.0 CMakeFiles/rccl.dir/hipify/src/bootstrap.cc.o CMakeFiles/rccl.dir/hipify/src/channel.cc.o CMakeFiles/rccl.dir/hipify/src/collectives.cc.o CMakeFiles/rccl.dir/hipify/src/debug.cc.o CMakeFiles/rccl.dir/hipify/src/enqueue.cc.o CMakeFiles/rccl.dir/hipify/src/group.cc.o CMakeFiles/rccl.dir/hipify/src/init.cc.o CMakeFiles/rccl.dir/hipify/src/init_nvtx.cc.o CMakeFiles/rccl.dir/hipify/src/net.cc.o CMakeFiles/rccl.dir/hipify/src/msccl.cc.o CMakeFiles/rccl.dir/hipify/src/proxy.cc.o CMakeFiles/rccl.dir/hipify/src/rccl_wrap.cc.o CMakeFiles/rccl.dir/hipify/src/register.cc.o CMakeFiles/rccl.dir/hipify/src/transport.cc.o CMakeFiles/rccl.dir/hipify/src/device/common.cu.cpp.o CMakeFiles/rccl.dir/hipify/src/device/onerank.cu.cpp.o CMakeFiles/rccl.dir/hipify/src/graph/connect.cc.o CMakeFiles/rccl.dir/hipify/src/graph/paths.cc.o CMakeFiles/rccl.dir/hipify/src/graph/rings.cc.o CMakeFiles/rccl.dir/hipify/src/graph/rome_models.cc.o CMakeFiles/rccl.dir/hipify/src/graph/search.cc.o CMakeFiles/rccl.dir/hipify/src/graph/topo.cc.o CMakeFiles/rccl.dir/hipify/src/graph/trees.cc.o CMakeFiles/rccl.dir/hipify/src/graph/tuning.cc.o CMakeFiles/rccl.dir/hipify/src/graph/xml.cc.o CMakeFiles/rccl.dir/hipify/src/misc/alt_rsmi.cc.o CMakeFiles/rccl.dir/hipify/src/misc/archinfo.cc.o CMakeFiles/rccl.dir/hipify/src/misc/argcheck.cc.o CMakeFiles/rccl.dir/hipify/src/misc/api_trace.cc.o CMakeFiles/rccl.dir/hipify/src/misc/ibvsymbols.cc.o CMakeFiles/rccl.dir/hipify/src/misc/ibvwrap.cc.o CMakeFiles/rccl.dir/hipify/src/misc/ipcsocket.cc.o CMakeFiles/rccl.dir/hipify/src/misc/npkit.cc.o CMakeFiles/rccl.dir/hipify/src/misc/nvmlwrap_stub.cc.o CMakeFiles/rccl.dir/hipify/src/misc/param.cc.o CMakeFiles/rccl.dir/hipify/src/misc/profiler.cc.o CMakeFiles/rccl.dir/hipify/src/misc/rocm_smi_wrap.cc.o CMakeFiles/rccl.dir/hipify/src/misc/rocmwrap.cc.o CMakeFiles/rccl.dir/hipify/src/misc/roctx.cc.o CMakeFiles/rccl.dir/hipify/src/misc/shmutils.cc.o CMakeFiles/rccl.dir/hipify/src/misc/signals.cc.o CMakeFiles/rccl.dir/hipify/src/misc/socket.cc.o CMakeFiles/rccl.dir/hipify/src/misc/strongstream.cc.o CMakeFiles/rccl.dir/hipify/src/misc/tuner.cc.o CMakeFiles/rccl.dir/hipify/src/misc/utils.cc.o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_lifecycle.cc.o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_parser.cc.o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_setup.cc.o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_status.cc.o CMakeFiles/rccl.dir/hipify/src/transport/coll_net.cc.o CMakeFiles/rccl.dir/hipify/src/transport/generic.cc.o CMakeFiles/rccl.dir/hipify/src/transport/net_tmp.cc.o CMakeFiles/rccl.dir/hipify/src/transport/net_ib.cc.o CMakeFiles/rccl.dir/hipify/src/transport/net_socket.cc.o CMakeFiles/rccl.dir/hipify/src/transport/nvls.cc.o CMakeFiles/rccl.dir/hipify/src/transport/p2p.cc.o CMakeFiles/rccl.dir/hipify/src/transport/shm.cc.o CMakeFiles/rccl.dir/hipify/gensrc/all_gather_sum_i8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/alltoall_pivot_sum_i8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/broadcast_sum_i8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/device_table.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/host_table.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_fclang++: warning: argument unused during compilation: '-Xarch_host -fstack-protector-strong' [-Wunused-command-line-argument] clang++: warning: argument unused during compilation: '-Xarch_host -fcf-protection' [-Wunused-command-line-argument] clang++: warning: argument unused during compilation: '-specs=/usr/lib/rpm/redhat/redhat-package-notes' [-Wunused-command-line-argument] Elapsed time (seconds): 9188.74 16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/sendrecv_sum_i8.cpp.o CMakeFiles/rccl.dir/git_version.cpp.o -fgpu-rdc -ldl /usr/lib64/librocm_smi64.so.1.0 /usr/lib64/libamdhip64.so.6.4.43484 --hip-link --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 /usr/bin/cmake -E cmake_symlink_library librccl.so.1.0 librccl.so.1 librccl.so gmake[2]: Leaving directory '/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build' [100%] Built target rccl gmake[1]: Leaving directory '/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build' /usr/bin/cmake -E cmake_progress_start /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/CMakeFiles 0 + RPM_EC=0 ++ jobs -p + exit 0 Executing(%install): /bin/sh -e /var/tmp/rpm-tmp.9i0DrL + umask 022 + cd /builddir/build/BUILD/rccl-6.4.2-build + '[' /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT '!=' / ']' + rm -rf /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT ++ dirname /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT + mkdir -p /builddir/build/BUILD/rccl-6.4.2-build + mkdir /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT + CFLAGS='-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer ' + export CFLAGS + CXXFLAGS='-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer' + export CXXFLAGS + FFLAGS='-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -I/usr/lib64/gfortran/modules ' + export FFLAGS + FCFLAGS='-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -I/usr/lib64/gfortran/modules ' + export FCFLAGS + VALAFLAGS=-g + export VALAFLAGS + RUSTFLAGS='-Copt-level=3 -Cdebuginfo=2 -Ccodegen-units=1 -Cstrip=none -Cforce-frame-pointers=yes -Clink-arg=-specs=/usr/lib/rpm/redhat/redhat-package-notes --cap-lints=warn' + export RUSTFLAGS + LDFLAGS='-Wl,-z,relro -Wl,--as-needed -Wl,-z,pack-relative-relocs -Wl,-z,now -Wl,-z,now -Wl,--build-id=sha1 -specs=/usr/lib/rpm/redhat/redhat-package-notes ' + export LDFLAGS + LT_SYS_LIBRARY_PATH=/usr/lib64: + export LT_SYS_LIBRARY_PATH + CC=hipcc + export CC + CXX=hipcc + export CXX + cd rccl-rocm-6.4.2 + DESTDIR=/builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT + /usr/bin/cmake --install redhat-linux-build -- Install configuration: "RelWithDebInfo" -- Installing: /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/lib64/librccl.so.1.0 -- Installing: /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/lib64/librccl.so.1 -- Installing: /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/lib64/librccl.so -- Installing: /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/include/rccl/rccl.h -- Installing: /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/include/rccl/nccl_net.h -- Installing: /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/include/rccl/amd_detail/api_trace.h -- Installing: /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/share/rccl/msccl-algorithms -- Installing: /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/share/rccl/msccl-algorithms/allreduce-allpairs-8n-ll-32tb-op.xml -- Installing: /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/share/rccl/msccl-algorithms/allreduce-allpairs-8n-ll-32tb.xml -- Installing: /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/share/rccl/msccl-algorithms/allreduce-allpairs-8n-ll-64tb-op.xml -- Installing: /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/share/rccl/msccl-algorithms/allreduce-allpairs-8n-ll-64tb.xml -- Installing: /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/share/rccl/msccl-algorithms/allreduce-allpairs-8n-simple-op.xml -- Installing: /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/share/rccl/msccl-algorithms/allreduce-allpairs-8n-simple.xml -- Installing: /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/share/rccl/msccl-algorithms/allreduce-allpairs-8n-simple_2.xml -- Installing: /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/share/rccl/msccl-algorithms/alltoall-8n-0-9kb.xml -- Installing: /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/share/rccl/msccl-algorithms/alltoall-8n-190kb-512kb.xml -- Installing: /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/share/rccl/msccl-algorithms/alltoall-8n-512kb-7mb.xml -- Installing: /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/share/rccl/msccl-algorithms/alltoall-8n-7mb-43mb.xml -- Installing: /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/share/rccl/msccl-algorithms/alltoall-8n-9kb-190kb.xml -- Installing: /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/share/rccl/msccl-unit-test-algorithms -- Installing: /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/share/rccl/msccl-unit-test-algorithms/all-reduce-ring-ll.xml -- Installing: /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/share/rccl/msccl-unit-test-algorithms/all-reduce-ring-ll128.xml -- Installing: /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/share/rccl/msccl-unit-test-algorithms/all-reduce-ring-simple.xml -- Installing: /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/lib64/cmake/rccl/rccl-targets.cmake -- Installing: /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/lib64/cmake/rccl/rccl-targets-relwithdebinfo.cmake -- Installing: /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/lib64/cmake/rccl/rccl-config.cmake -- Installing: /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/lib64/cmake/rccl/rccl-config-version.cmake -- Installing: /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/share/doc/rccl/LICENSE.txt + echo s@/builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT@@ + find /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/lib64 -name '*.so.*.[0-9]' + sed -f br.sed + find /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/lib64 -name '*.so.[0-9]' + sed -f br.sed + find /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/lib64 -name '*.so' + sed -f br.sed + find /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/lib64 -name '*.cmake' + sed -f br.sed + '[' -f /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/share/doc/rccl/LICENSE.txt ']' + rm /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/share/doc/rccl/LICENSE.txt + /usr/bin/find-debuginfo -j2 --strict-build-id -m -i --build-id-seed 6.4.2-1.fc43 --unique-debug-suffix -6.4.2-1.fc43.x86_64 --unique-debug-src-base rccl-6.4.2-1.fc43.x86_64 --run-dwz --dwz-low-mem-die-limit 10000000 --dwz-max-die-limit 110000000 -S debugsourcefiles.list /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2 find-debuginfo: starting Extracting debug info from 1 files DWARF-compressing 1 files dwz: ./usr/lib64/librccl.so.1.0-6.4.2-1.fc43.x86_64.debug: Unknown debugging section .debug_str_offsets sepdebugcrcfix: Updated 0 CRC32s, 1 CRC32s did match. Creating .debug symlinks for symlinks to ELF files Copying sources found by 'debugedit -l' to /usr/src/debug/rccl-6.4.2-1.fc43.x86_64 find-debuginfo: done + /usr/lib/rpm/check-buildroot + /usr/lib/rpm/redhat/brp-ldconfig + /usr/lib/rpm/brp-compress + /usr/lib/rpm/redhat/brp-strip-lto /usr/bin/strip + /usr/lib/rpm/check-rpaths + /usr/lib/rpm/redhat/brp-mangle-shebangs + /usr/lib/rpm/brp-remove-la-files + /usr/lib/rpm/redhat/brp-python-rpm-in-distinfo + env /usr/lib/rpm/redhat/brp-python-bytecompile '' 1 0 -j2 + /usr/lib/rpm/redhat/brp-python-hardlink + /usr/bin/add-determinism --brp -j2 /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT Scanned 38 directories and 316 files, processed 0 inodes, 0 modified (0 replaced + 0 rewritten), 0 unsupported format, 0 errors Reading /builddir/build/BUILD/rccl-6.4.2-build/SPECPARTS/rpm-debuginfo.specpart Processing files: rccl-6.4.2-1.fc43.x86_64 Executing(%license): /bin/sh -e /var/tmp/rpm-tmp.EQjDdd + umask 022 + cd /builddir/build/BUILD/rccl-6.4.2-build + cd rccl-rocm-6.4.2 + LICENSEDIR=/builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/share/licenses/rccl + export LC_ALL=C.UTF-8 + LC_ALL=C.UTF-8 + export LICENSEDIR + /usr/bin/mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/share/licenses/rccl + cp -pr /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/LICENSE.txt /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/share/licenses/rccl + RPM_EC=0 ++ jobs -p + exit 0 Provides: librccl.so.1()(64bit) rccl = 6.4.2-1.fc43 rccl(x86-64) = 6.4.2-1.fc43 Requires(interp): /sbin/ldconfig /sbin/ldconfig Requires(rpmlib): rpmlib(CompressedFileNames) <= 3.0.4-1 rpmlib(FileDigests) <= 4.6.0-1 rpmlib(PayloadFilesHavePrefix) <= 4.0-1 Requires(post): /sbin/ldconfig Requires(postun): /sbin/ldconfig Requires: glibc >= 2.41.9000-23 ld-linux-x86-64.so.2()(64bit) ld-linux-x86-64.so.2(GLIBC_2.3)(64bit) libamdhip64.so.6()(64bit) libamdhip64.so.6(hip_4.2)(64bit) libamdhip64.so.6(hip_4.3)(64bit) libamdhip64.so.6(hip_4.5)(64bit) libamdhip64.so.6(hip_5.0)(64bit) libamdhip64.so.6(hip_5.3)(64bit) libamdhip64.so.6(hip_6.0)(64bit) libc.so.6()(64bit) libc.so.6(GLIBC_2.10)(64bit) libc.so.6(GLIBC_2.14)(64bit) libc.so.6(GLIBC_2.16)(64bit) libc.so.6(GLIBC_2.17)(64bit) libc.so.6(GLIBC_2.2.5)(64bit) libc.so.6(GLIBC_2.3)(64bit) libc.so.6(GLIBC_2.3.2)(64bit) libc.so.6(GLIBC_2.3.4)(64bit) libc.so.6(GLIBC_2.32)(64bit) libc.so.6(GLIBC_2.33)(64bit) libc.so.6(GLIBC_2.34)(64bit) libc.so.6(GLIBC_2.38)(64bit) libc.so.6(GLIBC_2.4)(64bit) libc.so.6(GLIBC_2.42)(64bit) libc.so.6(GLIBC_2.6)(64bit) libc.so.6(GLIBC_2.7)(64bit) libc.so.6(GLIBC_ABI_DT_RELR)(64bit) libgcc_s.so.1()(64bit) libgcc_s.so.1(GCC_12.0.0)(64bit) libgcc_s.so.1(GCC_3.0)(64bit) libm.so.6()(64bit) libm.so.6(GLIBC_2.2.5)(64bit) librocm_smi64.so.1()(64bit) libstdc++.so.6()(64bit) libstdc++.so.6(CXXABI_1.3)(64bit) libstdc++.so.6(CXXABI_1.3.7)(64bit) libstdc++.so.6(CXXABI_1.3.9)(64bit) libstdc++.so.6(GLIBCXX_3.4)(64bit) libstdc++.so.6(GLIBCXX_3.4.11)(64bit) libstdc++.so.6(GLIBCXX_3.4.18)(64bit) libstdc++.so.6(GLIBCXX_3.4.19)(64bit) libstdc++.so.6(GLIBCXX_3.4.21)(64bit) libstdc++.so.6(GLIBCXX_3.4.22)(64bit) libstdc++.so.6(GLIBCXX_3.4.26)(64bit) libstdc++.so.6(GLIBCXX_3.4.29)(64bit) libstdc++.so.6(GLIBCXX_3.4.30)(64bit) libstdc++.so.6(GLIBCXX_3.4.32)(64bit) libstdc++.so.6(GLIBCXX_3.4.9)(64bit) Processing files: rccl-devel-6.4.2-1.fc43.x86_64 Executing(%doc): /bin/sh -e /var/tmp/rpm-tmp.7qcO3W + umask 022 + cd /builddir/build/BUILD/rccl-6.4.2-build + cd rccl-rocm-6.4.2 + DOCDIR=/builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/share/doc/rccl-devel + export LC_ALL=C.UTF-8 + LC_ALL=C.UTF-8 + export DOCDIR + /usr/bin/mkdir -p /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/share/doc/rccl-devel + cp -pr /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/README.md /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT/usr/share/doc/rccl-devel + RPM_EC=0 ++ jobs -p + exit 0 Provides: cmake(rccl) = 2.22.3 rccl-devel = 6.4.2-1.fc43 rccl-devel(x86-64) = 6.4.2-1.fc43 Requires(rpmlib): rpmlib(CompressedFileNames) <= 3.0.4-1 rpmlib(FileDigests) <= 4.6.0-1 rpmlib(PayloadFilesHavePrefix) <= 4.0-1 Requires: cmake-filesystem(x86-64) librccl.so.1()(64bit) Processing files: rccl-data-6.4.2-1.fc43.noarch Provides: rccl-data = 6.4.2-1.fc43 Requires(rpmlib): rpmlib(CompressedFileNames) <= 3.0.4-1 rpmlib(FileDigests) <= 4.6.0-1 rpmlib(PayloadFilesHavePrefix) <= 4.0-1 Processing files: rccl-debugsource-6.4.2-1.fc43.x86_64 Provides: rccl-debugsource = 6.4.2-1.fc43 rccl-debugsource(x86-64) = 6.4.2-1.fc43 Requires(rpmlib): rpmlib(CompressedFileNames) <= 3.0.4-1 rpmlib(FileDigests) <= 4.6.0-1 rpmlib(PayloadFilesHavePrefix) <= 4.0-1 Processing files: rccl-debuginfo-6.4.2-1.fc43.x86_64 Provides: debuginfo(build-id) = 7419e215cbd06f3f129a9977b5b74589ffee1589 librccl.so.1.0-6.4.2-1.fc43.x86_64.debug()(64bit) rccl-debuginfo = 6.4.2-1.fc43 rccl-debuginfo(x86-64) = 6.4.2-1.fc43 Requires(rpmlib): rpmlib(CompressedFileNames) <= 3.0.4-1 rpmlib(FileDigests) <= 4.6.0-1 rpmlib(PayloadFilesHavePrefix) <= 4.0-1 Recommends: rccl-debugsource(x86-64) = 6.4.2-1.fc43 Checking for unpackaged file(s): /usr/lib/rpm/check-files /builddir/build/BUILD/rccl-6.4.2-build/BUILDROOT Wrote: /builddir/build/RPMS/rccl-data-6.4.2-1.fc43.noarch.rpm Wrote: /builddir/build/RPMS/rccl-debuginfo-6.4.2-1.fc43.x86_64.rpm Wrote: /builddir/build/RPMS/rccl-debugsource-6.4.2-1.fc43.x86_64.rpm Wrote: /builddir/build/RPMS/rccl-devel-6.4.2-1.fc43.x86_64.rpm Wrote: /builddir/build/RPMS/rccl-6.4.2-1.fc43.x86_64.rpm Executing(rmbuild): /bin/sh -e /var/tmp/rpm-tmp.Ou0FEA + umask 022 + cd /builddir/build/BUILD/rccl-6.4.2-build + test -d /builddir/build/BUILD/rccl-6.4.2-build + /usr/bin/chmod -Rf a+rX,u+w,g-w,o-w /builddir/build/BUILD/rccl-6.4.2-build + rm -rf /builddir/build/BUILD/rccl-6.4.2-build + RPM_EC=0 ++ jobs -p + exit 0 Finish: rpmbuild rccl-6.4.2-1.fc43.src.rpm Finish: build phase for rccl-6.4.2-1.fc43.src.rpm INFO: chroot_scan: 1 files copied to /var/lib/copr-rpmbuild/results/chroot_scan INFO: /var/lib/mock/fedora-rawhide-x86_64-1753289447.166372/root/var/log/dnf5.log INFO: chroot_scan: creating tarball /var/lib/copr-rpmbuild/results/chroot_scan.tar.gz /bin/tar: Removing leading `/' from member names INFO: Done(/var/lib/copr-rpmbuild/results/rccl-6.4.2-1.fc43.src.rpm) Config(child) 257 minutes 20 seconds INFO: Results and/or logs in: /var/lib/copr-rpmbuild/results INFO: Cleaning up build root ('cleanup_on_success=True') Start: clean chroot INFO: unmounting tmpfs. Finish: clean chroot Finish: run Running RPMResults tool Package info: { "packages": [ { "name": "rccl-debuginfo", "epoch": null, "version": "6.4.2", "release": "1.fc43", "arch": "x86_64" }, { "name": "rccl", "epoch": null, "version": "6.4.2", "release": "1.fc43", "arch": "x86_64" }, { "name": "rccl-debugsource", "epoch": null, "version": "6.4.2", "release": "1.fc43", "arch": "x86_64" }, { "name": "rccl", "epoch": null, "version": "6.4.2", "release": "1.fc43", "arch": "src" }, { "name": "rccl-devel", "epoch": null, "version": "6.4.2", "release": "1.fc43", "arch": "x86_64" }, { "name": "rccl-data", "epoch": null, "version": "6.4.2", "release": "1.fc43", "arch": "noarch" } ] } RPMResults finished

_(S)I.MrPuLnE(]t/idN,C CsLu_bStTnE,P Sw/osrikz)e;o f (| T) ^ : stepSiz/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cppe:_17): 1{: note: | in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group 17 | DEFINE_ncclD/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.he:254v:F90u:n cnote: (in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested hereAl lReduce _254T | R EE _ S I MPPrLiEm_iPtriovde_sf<6T4,_ 4R,e dnOcpc,l FFuanncAAslylmmReedturicce<, NFCCuLnc_PMArXod_,DE Vdo_AuRbIlTeY,, N1C>C,L _A/L*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_4, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ GO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64_2, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64_4, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64_4, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInB/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_4, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_4, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_4, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_4, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_4, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_4, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64_4, ncclFuncAllReduce, FuncProd, dou:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64_4, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ble, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_4, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_4, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_4, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_4, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_4, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64_4, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64_4, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64_4, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64_4, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ eads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64_4, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64_4, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64_4, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx908. 21 warnings generated when compiling for gfx942. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1201. 21 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1200. [ 64%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ 173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ 21 warnings generated when compiling for gfx942. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uinIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2t32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: :218unused variable 'w' [-Wunused-variable]:15: warning: unused variable 'bid' [-Wunused-variable] 21880 | | c ons t i n barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ t bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hunused variable 'bid' [-Wunused-variable]: 366218 | :15: warning: unused variable 'bid' [-Wunused-variable] 366 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ [ 64%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u32.cpp.o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u32.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtnIn file included from , work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_2, ncclFuncAllReduce, FuncProdIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ , rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.htidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_4, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_4, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_4, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_4, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_4, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f8_4, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_4, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ >, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_4, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ _float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_4, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f8_2, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_4, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_4, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_4, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_4, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_4, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_4, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(ti/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f8_4, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ d), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_4, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_4, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_4, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f8_4, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f8_4, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_4, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f8_4, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_4, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f8_4, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_4, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_4, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, prot/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), no, unrotll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ hreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f8_4, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(g/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8_4, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ roup), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f8_4, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f8_4, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f8_4, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f8_4, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelIddata2, flag2; | ^~~~~ - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hIn file included from :366:15In file included from : warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, u/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>(/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h).run(); \ | ^ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_4, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ L>, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_4, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_4, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_4,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nth rnecacdlsF(unntchArlelaRdesd)u,c et,i dFIunnBclPorcokd(,t hurienatd3I2d_xt.,x )N,C CgLr_oAuLpG(Og_rToRuEpE),, N C| C ^~~~~~~~~~~~~~~~~L _PR/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hO:T670O:_60S:I Mnote: Pfield 'group' will be initialized after field 'stepSize'L E, 4) 670| | ^ tid(ti/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hd:)611,: 62n:t hnote: rexpanded from macro 'DEFINE_ncclDevFunc'e ads(nth r611e | a d s ) ,R utniWdoIrnkBBlaotcckh((,g raolugpo),, p r| o ^~~~~~~~~~~t o, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_4, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_4, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32_4, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_4, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_4, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_4, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_4, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32_2, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_4, ncclFuncAllReduce, FuncProd,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_4, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | R), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32_4, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ unWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32_4, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_4, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_4, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_4, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_4, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32_4, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_4, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_4, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.c/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Protoomm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32_4, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_4, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_4, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ edOp, Proto, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32_4, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32_4, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SI_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32_4, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ MPLE_Prod_u32_4, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32_4, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32_4, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().rkun(tid, s(ubtn,t work); h | ^ re/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:a22dIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ :1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 67122 | DEFIN | E_ncclDevFunc stepSize(stepSize_(Al lRedu=ce_RI=NG_SIM PLE0_Pr ?od _u32_n4cc,l nShmecclFmun.cAlclomm.buReducfefS, iFzuencsProd, uint32_t, NCCL_ALGO_RIN[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | G, NCCL _PRPOTO_SrIMPiLE,m 4) i| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.ht:611:62: inote: expanded from macro 'DEFINE_ncclDevFunc' v611 | e RunsWorkBr,i acl<1>, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested herego, p roto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthr 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | eads( nthr eads), tidInBlock(thre adIdxi.x), gfrou p(g(routp), i| ^~~~~~~~~~~~~~~~~d /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670 :60: note: | ().run(tid ^~~~~~~~~~~, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32_4, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1201. 1717 warnings generated when compiling for gfx1102. warnings generated when compiling for gfx908. 21 warnings generated when compiling for gfx942. 21 warnings generated when compiling for gfx90a. [ 64%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u64.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 21 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t dataIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp1, flag:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 1, data2, flag2; In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \Idx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmeIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ m.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ :218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId -/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ work-In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ >channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64_2, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64_2, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_u64_2, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_u64_2, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_u64_2, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64_2, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64_2, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64_2, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid),In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitive nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_u64_2, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ s, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64_2, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64_2, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64_2, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), gro group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64_2, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here eads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64_2, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_u64_2, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ op, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_u64_2, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64_2, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64_2, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u64_2, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2 | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64_2, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.b0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here<1>, 0, Proto, 0> prims | ^ 254/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | | runRi ng(tid, nthreParimitives, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWoTY, 1>, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runrkCoTll(w).runn(tid<, subTtn, w,ork); R| ^edOp, ProtoSimple<1, 1, COLL_UNROLL>, COLL_U N/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested hereR 12O | DLELFI>NE_ncclDev(Func(tAlliRd, nthreads, work); | educe_RING_SIMPLE_Prod_u64_2, ncclFuncA ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtnll,Redu ce,w FuncoProd, ruint6k4_t), N;CCL_A LGO_RING , NC| CL_PROTO ^_SIM PLE, 2) /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62:: note: expanded from macro 'DEFINE_ncclDevFunc' 7 611: | RunWo1rkBatc:h, 0, 2, 2>::run' requested heret y , r7e | dDoEFINE_ncclDevFunc(p, algo, proto, unroll>().rAllReduce_TREE_SIMPLE_Prod_u64_2, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | un(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h: 670:15 : note: Rfield 'nthreads' will be initialized after field 'tidInBlock' u670 | n W toid(tird), nkthreaBds(nthareadst), ticdInBlhoc, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(htireda)ds(,nth readnst),h tirdIneBlaodck(sthre(adIndxt.x)h, grrouep(garoudp),s )| ^~~~~~~~~~~, tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64_2, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? nc.buffSi/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64_2, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid),pDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64_2, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ zes[NCCL_PROTO_SIMPLE]/NCCL nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ _STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(grou /p*Dire)ct=*,/0, P roto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nt h| ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ r| tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671e | a stdepSisze(st,epSi ze_ =w= 0 ?o ncclrShmemk.com)m.buff;Size s[NCCL_PR OTO_S| IMPLE ^]/NC CL_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hSTEPS/sizeo:f432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Pr | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_nccDEVl_ARIDTY>,e /*DvirFecut=*/n0, Pcroto(, 0>A lprlimsR | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5:e note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here d 565 | u runTreeUpDown, aCOLL_tUNROcLL>(htid,< nthcreados, wlork)l; | , ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h: 432:78t: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | y , i f (tride d< soubtnp) RunFn, T, RedOp, Algo, Proto, COLL_UNROLL>().run(tid, su, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlockb(tn, tworkh); r| e ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7a:1: note: din instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here I7 | DdEFINE_nxcclDevFu.nc(AxllRe)duce_,TREE _SIgMPLEr_Prood_u64u_2, pnccl(FgurnocuApll)R,e | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tiduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hd(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64_2, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), n:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64_2, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ threads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64_4, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64_2, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nt/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWohrrkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64_4, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ eads(nthreads), tidInBlock(threadIdx.x), group(group1062) | , run Ring( tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_tid , n threads,671 work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h | Primitiroto, COLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_u64_2, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ ves, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing ste(pSizte(stiepSidze_ ,== 0 ? nncclShmetm.chommr.beufadfSsi, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: zes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl{( | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ )| group(group ./builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:r63:56u: note: nin instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here (63 | t i d P,rim itisvesu, ;0 , | ^Pr ot/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cppo,:12 :1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevF0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(Etid,, nth2rea)ds, wo rk); | ^ | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h^:432: 78:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432: | 611 : 62 : if (tinote: d (u)nWo.rkrBatunch(, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x),:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u64_2, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x)| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62, group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u64_2, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ : note: expanded from macro 'DEFINE_ncclDevFunc' 611 | group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tid I n BRluonWocrkBkatc(hI, adlgox, prot.o,x unroll>()),. rgurno(up); (g\ ro u| ^p /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h), : | 670 ^~~~~~~~~~~:15 : note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u64_2, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nth/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:reads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64_4, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.c/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] omm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | Pr tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u64_2, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u64_2, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Algo, Proto, COLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u64_2, ncclFuncAllRedu group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u64_2, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? nc:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>MPL(E]/NCCL_tSTEPS/siizeof(T)d : stepSize_) {, | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hn:254:90t: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here h 254 | r Priemitivesa, /*Direct=*/| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl prim,s | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hC:565O:5: note: Lin instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565L | run_TreUeUpDNownROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:17:1: , 0, 2, 4>::run' requested herep, Pr oto Simple17< | 1, 1D, COLEL_UNRFOLL>,I COLLN_EUN_nRcOLcLl>DevFu(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78nc(AllReduce_TREE_SIMPLE_Prod_u64_4, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_A: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested hereL 432G | O _ iTf (tRid :611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(A redop, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIlldReduxce_T.REE_xSIMP)LE_,Prod _u64g_4r, noccluFuncpAllR(educge, FurncProod, uuintp64_)t, NC,CL _ALGO_TREE, NCCL_PRO| TO_S ^~~~~~~~~~~~~~~~~IMPL E, 4) | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62:: note: 670:60: note: field 'group' will be initialized after field 'stepSize'expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u64_4, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64_4, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ ,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads),In file included from tidInBlock(threadIdx/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_u64_2, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64_4, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().runIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), ()t; \ | i ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670d:15: note: field 'nthreads' will be initialized after field 'tidInBlock'I nBlock(thr 670 | e tiad(tid)d, nthreIads(ndthreadxs), .tidInBlock(thrxeadIdx).x), ,group( group(ggrorup),oup), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | s tepSize(stepSitid(tid), nthreads(nthreads), tidInze_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63Bloc | k(thr eadIdx. x), gr oup(gr oup),P | ^~~~~~~~~~~ rimitives, 0, /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64_4, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreadsProto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u64_2, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hst:670:15e: warning: pinitializer order does not match the declaration order [-Wreorder-ctor] S670 | i tizd(tied), _nthr eads=(nth=reads ),0 ti? ndcIcnBllSohcmke(mt.hrceomamdI.bduxf.fSx),i zegrosu[Np(CCgL_rouPpR)O,T O _SIMPLE]/NCCL| ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSiz_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitivesin instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here, /63* | D irect=*/0, Proto, 0> prims | ^ Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64_4, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ etric<1>, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h558:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl, ProtoSimple<2, 2, 4>, 4>' requested hereOLL_UNROL L>558 | ().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_nccl D runRingn(tidc, nt(hreadAs, wlork);l | ^R /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.he:432:78:d note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here u 432 | c e_TR iEfE_SIMPLE_P (rto/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] id d< s 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64_4, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ _u64ub_4,tn )ncclFu RunWorkColl ( ).| ru^n( ti/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hd, s:ub611tn:, 62wo:rk note: )expanded from macro 'DEFINE_ncclDevFunc'; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp611:22 | : 1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here R22u | nWorDkBaEtFIcNhE<_ncolccll, Detvy, rFeduonc(pA, algo, proto, unroll>().run()llR; educe_RING_SIMPLE_Prod_u64_4, ncclFuncAllReduc\e , FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64_4, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64_4, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64_4, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u64_4, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u64_4, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64_4, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), L_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64_4, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64_4, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64_4, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64_4, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64_4, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdPROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64_4, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ x.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group _/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u64_4, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u64_4, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ T, RedOp, FanSymmetric<1>, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u64_4, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u64_4, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buff 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u64_4, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Sizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u64_4, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64_4, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u64_4, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 21 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx1030. [ 65%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:In file included from 2/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ : warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from :218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ :366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | constIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ LE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl ( ) . rtuind((ttiidd,) ,s unbtthnr,e awdosr(kn)t;h r e| a ^d s), tidInB/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:l7o:c1k:( tnote: hin instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested herer eadIdx.x) ,7 | gDrEoFuIpN(Eg_rnocucpl)D,e v F| u ^~~~~~~~~~~n c(AllReduce_TREE_SIMPLE_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group),In file included from | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_4, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_4, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Pro/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_4, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | ), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_4, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_4, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8_2, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_4, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_4, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670: 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_4, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_4, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBloc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tik(dthrea(dIdx.x)t, grouip(groudp), | ) ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ , 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_4, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8_4, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_4, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_4, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_4, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_4, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8_4, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_4, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_4, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8_4, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_4, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ RedOp, FanAsymmetric<1, NCCL_MAX_DEV_ARITY>, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_4, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_4, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_4, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8_4, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8_4, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1101. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8_4, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | warnings generated when compiling for gfx1100. tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8_4, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8_4, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8_4, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_4, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8_4, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for host. 17 warnings generated when compiling for gfx1030. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8_4, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8_4, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx1200. 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx942. [ 65%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_bf16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ 2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, dIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WAaRP_SItZaE2;, \f l a| g ^2 ; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARPIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ _SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->chaIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ nnelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ :366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_2, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_2, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_2, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_2, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_2, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_2, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_2, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16_2, ncIn file included from cl/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cppF:u2n: cIn file included from A/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hl:l11R: educe, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_2, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_2, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_bf16_2, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_bf16_2, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_2, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_2, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_bf16_2, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ [NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_2, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_2, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(In file included from threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_2, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_2, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_2, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_4, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_bf16_2, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16_2, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_bf16_2, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_2, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_bf16_2, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16_2, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16_2, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_2, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_2, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | Run/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16_2, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads),WorkBa ttcihd),, aglrgoou,p (pgrrootuop,) ,u n r| o ^~~~~~~~~~~~~~~~~l l>().run/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h(:)670;: 60\: note: | field 'group' will be initialized after field 'stepSize' ^ 670 | tid(tid), nth/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hr:e670a:d15s:( nnote: tfield 'nthreads' will be initialized after field 'tidInBlock'h reads), tidIn B670l | oc k ( t htrieda(dtIiddx).,x )n,t hgrreoaudps((gnrtohurpe)a,d s )| , ^~~~~~~~~~~ tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16_2, ncclFuncAllReduc:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_2, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ e, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_4, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16_2, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_2, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_4, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16_4, ncclFuncAl/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here lReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_4, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_4, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_2, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), ti/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16_2, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_4, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ dInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_bf16_2, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_4, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_4, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16_2, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_4, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16_2, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_4, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_4, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_4, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_bf16_2, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_4, ncclFuncAllReduce, FuncSum, hip_bf/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ adIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_4, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_4, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16_4, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16_2, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_4, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.c/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreadomm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_4, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ s, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16_4, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16_4, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16_4, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16_4, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16_4, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_4, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_4, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_4, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_4, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16_4, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16_4, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16_4, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16_4, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16_4, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx908. 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx942. [ 65%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_bf8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShme/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ m.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | cons/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ t int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14:7 warning: unused variable 'data1' [-Wunused-variable] 145 | : uint 32_t datwarning: a1, flagunused variable 'w' [-Wunused-variable]1, data2 , flag2; | ^~~~~ 75 | barrIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ ier_by_group();/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145: 21: warning: unused variable 'flag1' [-Wunused-variable] 145 | u| int32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const iIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ nt w = threadIdx.x/WARP_SIZE; \ | ^ In file included from 2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channel/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ Id - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShm/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hem.channelId - work->channelLo; | ^~~ :218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] : note: expanded from macro 'barrier_by_group' 29 | 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8_2, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8_2, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8_2, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8_2, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8_2, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tIn file included from idInBlock(thre/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:a175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.hdIdx.x), group:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor]( 496 | g roup), | ^~~~~~~~~~~ tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->doIn file included from w/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8_2, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ n, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_bf8_2, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_bf8_2, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); In file included from | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncc/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:l2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:D11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:e173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670v:15: warning: Finitializer order does not match the declaration order [-Wreorder-ctor] u670 | n tid(ctid),( nthrAeadIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8_2, ncclFuncs(lnthrelads),R tideInBduce_loTck(threadIdREE_Lx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ L1 28_Su| m_bf8 tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize__2, nc clFun cAll671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSReduice, FzuncSume, rccl_bfloat8, NCCL_ALGAOllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ _TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatchPS/s,izeo f(aT) :l stegpSizeo_) {, p | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ r | group(groupoto, unroll>().run(); \ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> | p ^ rims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8_2, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIn file included from Idx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp254:2: In file included from :/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: 90In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173:: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670: 15: warning: note: initializer order does not match the declaration order [-Wreorder-ctor] in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here670 | tid(tid)254, nt | hrea ds(n threads) , t PriimdInBilocktives, /*Direct=(*thre/adIdx0.x),, gr oup(gProupr), o | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ t | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ o 671 | , step0Size(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_S> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h(:t254:90:i note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here d 254, | Pnrimittivehsreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432, 0, 2, 2>::run' requested heremetr ic< NC432 | if (tid < subtn) RunWoCLr_MAX_DEV_ARITY, 1>, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:kC5oll<:Fn, T, RedOp, Algo, Proto, COLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPL Enote: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here _565 | S ruunTremeUpD_ownb, FCOLLu_UNRnOLL>c(tidA, ntlhrealds,R eworkd); u| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hc:432e:78: ,note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | F uncSum, rccl_b f ifl (tiod , algo, proto, unroll>(o, )Prot.o, CrOLL_uUNROLL>().run(tind, (su)b;tn , \wo rk );| ^| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:7::1670: :note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here15 : 7note: | Dfield 'nthreads' will be initialized after field 'tidInBlock'EF IN E_nc670cl | De vF u nc (AtlliReddu(cet_TiREdE_SIMP)LE,_S umn_thbfr8_e2,a ncdcslF(unncAtllhRerduece, FuncSum, rccla_dsb),f tlidIonat8, NCCL_ALGO_TREE, NBlock(threadIdx.x), group(group), CCL_P| RO ^~~~~~~~~~~~~~~~~TO _/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hSI:MP670LE, :2)60 : note: field 'group' will be initialized after field 'stepSize' | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h670:611: | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.62:x note: )expanded from macro 'DEFINE_ncclDevFunc' , 611 | g r RounuWpor(kBgatrcho, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8_2, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8_2, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8_2, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8_2, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8_2, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(thre_STaEPS/sidzeof(T) :I stepSized_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~x | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h.:303:90:x), note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Prot groupo(group), , | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | 0 stepSize>(stepSiz e_ == 0p ? ncclShrmem.commi.buffSimzes[NCCLs_PROTO_ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:SIMPLE]/NCC565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | L_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303: r90unTr:eeUpD own, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here, Pro toSim ple<1, 1,303 COLL | Primitives<_UNROLL>, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | T, RedO p, iFanAfs (tid ymm,n) RunWorkColl prtims o| , COLL_UN ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown(),.run (tid,C subOtn, LworkL); _| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cppU:7:N1: note: Rin instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here O7 | DELL>, COLL_UNROLFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8_2, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL>(L_PROTO_SIMPLE, 2) | ^tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h | :611:D62: Enote: expanded from macro 'DEFINE_ncclDevFunc' 611 | F I RuNnWoErkB_atcnh,F algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | un c( AltlRiedudce_T(REEt_SIiMPLEd_Su)m_b,f8_ 2, nnccltFunhcAlrlReeducae, dFunsc(Snthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch), ,nthr eadas(nlthrgeados),, tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8_2, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8_2, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8_2, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8_2, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8_4, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Pri/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), gr| o stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | u warpIpnBlock((threadgIdx.x/WroARP_SIuZE), p| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | ) warp(tid/WARP_SIZE 498 | , fla | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ gThrea671d((ti | d%4)== 3), gr oup( stepSize(stepgroSup),i | z ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 e 499 | _ stepS ize(n=c= cl0 ? ncclShmem.Shmcem.comom.buffSimzes[Nm.buffSmitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8_4, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ izes[NCCL_PROTO_LL128]/NCCL_STEPCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here S63/size | of(ui nt64_ t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group P/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63r:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here i 63 | m Pirimititves, 0,y Promtmetric<1>, 0, o, P0> prirms | o ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hto, 0> prims :1062:5:| note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here ^1062 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runR ing(tid, nProto, COLL_UNROLL>(tidthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_bf8_2, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ , nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8_2, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_bf8_2, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8_2, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_bf8_2, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8_2, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBloIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8_2, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ck(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads),/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nt wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_bf8_2, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ hreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8_2, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(t/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group id), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8_2, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ .x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8_2, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ MAX_DEV_ARITY>, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8_2, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 1, COLL_UNROLL>, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8_4, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8_4, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(g/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8_4, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8_4, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8_4, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(th/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hreadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ :| tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 670671 | :stepSi15ze(ste:pSize_ == 0warning: ? nccinitializer order does not match the declaration order [-Wreorder-ctor]lShm em.com m.buf670 | fSiz tid(tides)[NCCL_,PROTO nthre_SIMPLads(E]/n/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8_2, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), threNCCLa_dSTEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | s), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMP LE]/NCCL P_rimSitivesTe, /*Diroect=*/f0, Pro(to,T) : stepSize_) 0> pri{ms | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565 :5| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | , COLL _UN RO LL>(rtid,u nthnreadRs, wiornk); g | (tid, nthrnote: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested heree 432 | a d sif (,ti d < wsubotn) rRunkWo); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: rkColl, 1, 2, 4>::run' requested here, R edOp , A432 | lgo, Proto, COLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(A if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8_4, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ llReduce_TREE_SIMPLE_Sum_bf8_4, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8_4, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTree/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hUpDown, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8_4, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), groupedOp, ProtoSimple<1, 1, COLL_UNROLL>, COLL_UNROLL>(tid, nthre/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) Run:670W:15: warning: initializer order does not match the declaration order [-Wreorder-ctor]o 670 | r tid(ktid), Cnthreados(nthll().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:17:1: note: grin instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested hereoup( group ), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ 17 | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ | 671 | D stepESize(FstepISize_N == 0 E? ncc_lShmencclDevFunc(AllReduce_TREE_Sm.coImm.buMffSizePs[NCCLL_PROTO_SIMPLE_Sum_bf8_4, ncE]/cNCCL_SlTEPS/Fsizeouf(ncAllReduce, FuncSum, rccl_bfloat8, NT) : CstepSCize_) L{ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~_ | group(group A/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:LGO_TRE90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*kDirBect=a*/0,tch, algo, proto P,roto , 0>u prinms r| ^o /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:l565:5:l note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here >565 | ( r)u.run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | n Tree UpDotwn,h COLrLeads), tidInB_UNROLL>(tid, nthreads,lock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nt wohrk)r; e| ^ ads/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432(:78:n note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested heret h432 | r e iaf (dtids < )subt,n) RuntWorikCodll( ).run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8_2, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PRO:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8_4, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? nTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ cclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8_4, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8_4, ncclFuncAllReduce, FuncSum, rccl_bfloat8, N/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_CCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Sum_bf8_4, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto,s(nth reads), 0tidInBlo>ck(thre adIdx.x)prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | , group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? n runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid , FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here _303 | U PriNmitROLL>().run(tidive,s,n, wo rk); | / ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here * 22 | DEFDINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8_4, ncclFuncAllReduce, FuncSum, rccl_bfloirect=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8_2, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ at8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8_4, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | ), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primit iPrimitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8_4, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ves, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8_4, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work);r oup), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8_4, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8_4, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8_4, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nth_PROTO_Sreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8_4, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreaIMPLE]/NCCL_STEPS/sizeof(T) : sds(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8_4, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_bf8_2, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8_4, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8_4, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, s17ubtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8_2, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RI warnings generatedN when compiling for host. G, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8_4, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8_4, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8_4, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8_4, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8_4, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8_4, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx906. 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx942. [ 65%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f16.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cppIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ :1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | b/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: arrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | counused variable 'w' [-Wunused-variable]n 75 | s barrietr_by_gro up(); | i ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.hnt w = threadIdx.x/WARP_SIZE; \ | ^ :29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hIn file included from :366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_g/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ roup(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, d/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2a: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: tIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:a145:14: 2warning: unused variable 'data1' [-Wunused-variable] 145 | , ui nt32_tf datal1, flaga1, datga2, fl2ag2; ;| ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h: 145:21: warning: unused variable 'flag1' [-Wunused-variable] 145| | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_In file included from by_group();/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] :15: warning: unused variable 'bid' [-Wunused-variable] 27 | 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ const int bid = ncclShmeIn file included from m.channelId - w/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14o: warning: unused variable 'data1' [-Wunused-variable]r 145 | k - uin>t32_t cdata1h, flaag1, danta2, nflag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flagIn file included from 1/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: ,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15 : warning: unused variable 'bid' [-Wunused-variable] d27 | a cotnst iant bid = ncclShmem.channelId - work->channelLo; | ^~~ elLo; | ^~~ 2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp,:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from f/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: l/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75a:7: warning: gunused variable 'w' [-Wunused-variable] 751 | , barr ier_bdy_groaup(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:t15: note: expanded from macro 'barrier_by_group' a 29 | 2 co,nst in t w =f threladIdxa.x/WgARP/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h2; | ^~~~~ _SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = n:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ ccl/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cppS:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ hmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channel:366L:15: owarning: unused variable 'bid' [-Wunused-variable] ; 366 | cons| t int ^~~ bi d = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ : In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barriIn file included from er_by_group(); /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group| ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h(:29:15: note: expanded from macro 'barrier_by_group') 29 | const int w = thr;eadIdx.x/WA RP_SIZE; \ | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' | ^ 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ 2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1,In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ flag1, data2, flag2; /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barriIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ er_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid =:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint3/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | c2_t daota1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ nst int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncSum<__half>, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncSum<__half>, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncSum<__half>, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads)/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h,: 670t:i15d:I nwarning: Binitializer order does not match the declaration order [-Wreorder-ctor]l ock(threadIdx. x670) | , g r otuipd((gtriodu)p,) ,n t h| r ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~e a d| s tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_( nthreads )671, | t i d IsntBelpoScikz(et(hsrteeapdSIidzxe._x )=,= g0r o?u pn(cgcrloSuhpm)e,m . c| o ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~m m .| b tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_u ffSizes[ N671C | C L _ P RsOtTeOp_SSiIzMeP(LsEt]e/pNSCiCzLe__S T=E=P S0/ s?i znecocfl(STh)m e:m .comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), sgrtoeuppS(igzreo_u)p ){, | | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~~~~~~~ | group(group/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h :670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(ti/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hd:)63,: 56n:t hnote: rin instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested heree ads(nt h63r | e a d s )P,r itmiidtIinvBelso, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ .x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_2, nccl ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncSum<__half>, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ FuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncSum<__half>, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_4, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncSum<__half>, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_4, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_4, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_4, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInB/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(lock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_4, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_4, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_4, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_4, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid),:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_4, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_4, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_4, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16_4, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_4, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_4, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ etric<1, NCCL_MAX_DEV_ARITY>, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_4, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16_4, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_4, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16_4, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_4, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_4, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16_4, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x)/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_4, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nt 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16_4, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ hreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16_2, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16_4, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16_4, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16_4, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_4, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16_4, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_4, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_4, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16_4, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16_4, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16_4, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 21 warnings generated when compiling for gfx942. 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx1200. 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx942. [ 66%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f32.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx./builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | In file included from ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group'/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h: 173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: In file included from 29 | conwarning: unused variable 'w' [-Wunused-variable]s 75 | t/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h :11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:i173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h: 75n:7t w = threadIdx.x/WARP_Sbarrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:: warning: 15unused variable 'w' [-Wunused-variable] 75 | : note: expanded from macro 'barrier_by_group' barrie29r_by_ | group() ; | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15 : const int w =note: expanded from macro 'barrier_by_group' 29 | const int w = threadIZE; \ | ^ threadIdx.x/WARP_SIZE; \ | ^ Idx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_grouIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from p(/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h); : | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp174 ^~~~~~~~~~~~~~~~~~ :/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | :29: 15: note: expanded from macro 'barrier_by_group' 29 | const int:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const in batrrier _by_growup(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h=:29:15: note: expanded from macro 'barrier_by_group' 29 | t conhst int rw = thereadaIdx.x/dWARP_Idx.x/WSIZEA; \ | R P_SI ^ Zw = tEhreadI; \ | ^ dx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1145 | , uint3 2_t dadta1,a flagta2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.hIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ :145:1,21 data:2, fl ag2; warning: | ^~~~~ unused variable 'flag1' [-Wunused-variable]/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145: 21: warning: unused variable 'flag1' [-Wunused-variable] 145 | u145int32_ | t dat a1, f lag1, da tau2, iflagn2; t| ^~~~~ 3/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: 2warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, _t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] flag1451, da | ta 2, fl ag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h: 145:35: warning: uunused variable 'flag2' [-Wunused-variable] 145 | i uinnt32_tt d3ata1, 2flag1_, datt data1, flag1a2, flag2; | ^~~~~ , data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const inIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ t bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_2, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_2, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, work->sendbuff, work->recvbuff, work->redOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f32_2, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ 670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*DireIn file included from ct=*/0, /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cppProto:, 02: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11> p: rimsIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565 :5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 496 | 565 | runTreeUpDown, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_2, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nthreads), wid(tid%WARP_SIedOp,Z ProtEoSimpl)e<1, ,1, CO LL_UNwarp(tid/WROALL>, RCOLL_UPN_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | R OLL>( tid, nthr eads,w worka); rpInBlock(th| ^ r/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432e:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested herea dIdx.x/WARPIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_432 | S IifZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | ( warp(tid/WARP_SIZEtid _Sum_f32_2, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ < subt498n) | Ru n Wor k flagThread((Coll()f.run(tid, Ssubitn,z eworsk);[ | N ^ C/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:C7:1:L note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here_ P7 | RDOEFITNE_On_LL128]/NCCL_STEccPlDeSvFu/nc(sAillzReeducoe_f(uint6TR4EE_S_IMPtLE_)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:421:Su9m:_f 32_note: 2,in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here nc clF uncAll421Re | duce, FuncSum, floa t , N pCriCmsL(t_idA, nthreads,L GO_TRtree->doEE, NCwCLn_P,RO TOtree->down, work->send_bSIuMPfLE, 2) f ,| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:w611:o62:r note: kexpanded from macro 'DEFINE_ncclDevFunc' - >611 | r e cRuvnWborukBfatfc, whredOpArg); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: lnote: lin instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here, ty , r1070ed | op , arlugno,T prroetoe, uSnrpolll>i()t.rd(), nthretid, nthreads, waodsr(nkth)re;ad s) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives),( n)th.reradus(nn(tthrieadds,),_MAX_DEV_ARITY, 1>, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_2, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tidsInuBlboctk(nth,re adIwodxr.xk),) g;roup( g r| ^oup), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f32_2, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZEIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f32_2, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ , &tree->up, work->sendbuff, work->recvbuff, work->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f32_2, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_2, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, work->sendbuff, work->recvbuff, | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1070:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1070 | runTreeSplit(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:5:1: note: in instantiation of member function 'RunWorkBatch, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f32_2, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_2, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn):670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(thre RuanWordkColIl( | ).ru n(ti d, s ubtn , wsork)t; e pSize(stepSize_ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp=:7:=1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | 0 ? nccDEFlINE_Snchmem.comm.buffSizes[clDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_2, ncclNCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives,, 2) | ^0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611: 62: note: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hexpanded from macro 'DEFINE_ncclDevFunc' 611 | :RunW558orkB:atch<5col:l, t note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here y, redop, algo, proto, unrol558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < slu>(b).trnu)n( );R \u | n ^ W/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.ho:670r:15k: Cnote: field 'nthreads' will be initialized after field 'tidInBlock'o l670l | < F tnid,(t idT),, nt hrReeaddsO(npt,h reAadls), gtiodI,nB loPckr(tohrteao, dICdxO.xL),L group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), n_tUNhROrLL>e()a.rduns(t(idn, tsuhbtrn,e waork);ds) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncc,l tiDdInBloeckv(tFhrueandIcdx(.xA),l grlouRp(egrdouupc)e, _| ^~~~~~~~~~~R ING_SIMPLE_Sum_f32_2, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_2, ncclFuncAllReduce, FuncSum, floa432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_2, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_2, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_)/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_2, ncclFunc { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | ruAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | n cclD evFu nc(AllRedutce_TiREEd_SIMPLE_Sum_f32_2, ncclFuncAllReduce, FuncSum, (tid), nthreads(nthreads), tidInBlock(threadIdx.x), groflouat, pNCCL(_ALGgO_TREE, NCCLr_PROoup), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSiTO_SIMPLE, z2) e| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h_:611 :62: note: =expanded from macro 'DEFINE_ncclDevFunc' = 611 | 0Run Wor?kBat ncclShmem.comm.buffSizes[NCCL_PROTO_Sch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock'IM PL E]/NCC670L_S | TEP S/s izeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ ti d(t id| ), group(groupnth rea/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hd:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives(snth, /*Direct=*/0, Proto, 0> up(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x)prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_4, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, p/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreroto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_2, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Block(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), gT) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prroupi(groump), s | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | st| epSize ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here (stepSize_ == 0 ? ncclShmem.comm 565 | runTreeUp.DowbuffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : snt,_ COLL_)UNROL L>(t{id, | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group nt hreads/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h,:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_2, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , COLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_2, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1101. /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Protin instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_2, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ o, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp17 warnings generated when compiling for gfx906. :17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_4, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f32_2, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f32_2, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:611:62::670 :15note: expanded from macro 'DEFINE_ncclDevFunc' In file included from :611/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp | :warning: initializer order does not match the declaration order [-Wreorder-ctor] 2 : In file included from 670/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hR | unWorkBatchi,d, )nta,hrl eagndsot(n,hth rrpeearados), tdtiosdI,(nBn lotuckh(thrreaedaIddx.sx), tidInBlock(threadIdx.x), group(group), | ) ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~, gr ou| tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_p (g rou671p | ), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ s | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ t671 | stenroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ pSize(stepSize_ == 0 ? nccepSize(stepSize_ =l=Sh m0em .c?o nmcclShmem.comm.buffSizes[NCCL/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] _PROTmO.b_uffSSiIzeMs[PNCLCLE_P]RO/TON_SCIMCPLLE]_/NSCCTL_ESTPES/PSs/siizzeoef(oT) f: (stTe)pS i:z stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Per_)i {m i| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(groupt iv/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.he:63s:56<: Tnote: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here, 63 | R e dPrOimpit,i veFs, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1062 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ FanSymmetric<1>, 0, Proto,symmetric, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f32_2, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ _> MprAimX_DEV_ARITY, 1>, /*Dis r | e ^ c/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.ht:558=:5*/: 0note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here, 558 | P ro truonR,in g prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:ed5Op:, Pnote: rin instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested hereoto , COL565L | _ UN RO LL >(rtiud,n nTthrreeeUpDown, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_f32_2, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ :m78:p note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested herel e<1, 1, COLL_UNROLL>, COLL_UNROLL>(tid, nthr432 | if (tid < subtn) RunWorkColl, 0, 2, 2>::run' requested here 432 | dO p, Ailgfo, P(rottoi, dC OL(t).nru)n(t iRd,u nsWubotnr, kwoCrk)o; l | l ^ , 1, 2, 2>::run' requested hereC O 12L | DLEF_INUE_NncRclDevFOunLc(LAl>lR(ed)uc.e_rRIuNGn_S(tid, subtInMP,LE _Swumo_fr32k_)2;, ncc lF | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:un1cA:ll Renote: duin instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested herece , Fu7nc | Sum, float,DEFINE_ncclDevFunc(AllR eNCdCLu_AcLGeO__RTINRG, ENECC_L_SIMPLE_Sum_f32_2, ncclFuncAllReduce, FuncSum, float, NPRCOTCO_LSI_MPALEL, G2)O | _^T /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.hR:E611:62E: ,note: expanded from macro 'DEFINE_ncclDevFunc' N611 | C C LRu_nWPorRkBOatcThO,2 a)lg o, p| ro^to ,/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h unr:ol611:62l>:() .rnote: unexpanded from macro 'DEFINE_ncclDevFunc'() ; \ 611| ^ | RunWorkBatch ,e adasl(gont, hpreraodtso),, utnirdoIlnlB>l(o)c.kr(utnh(r)e;a d\I d x| . ^x )/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h, :g670r:o15u:p (note: gfield 'nthreads' will be initialized after field 'tidInBlock' r ou670p | ) , | tid ^~~~~~~~~~~~~~~~~( t/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hid:)670,: 60n:t hnote: rfield 'group' will be initialized after field 'stepSize'e a ds670( | n t h r etaidds(t)i, dt)i,d InntBhlroecakd(tsh(rnetahdrIedxa.dxs)),, gtroiudpI(ngBrlooucpk)(,t h r| e ^~~~~~~~~~~~~~~~~a d/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hId:x.670x:)60,: gnote: rfield 'group' will be initialized after field 'stepSize' ou p670( | g r o utipd()t,i d )| , ^~~~~~~~~~~ nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f32_2, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f32_2, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f32_4, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:498:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 496 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 497 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 498 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 499 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROIn file included from TO/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from _/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: LIn file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hL:670:15:1 warning: 2initializer order does not match the declaration order [-Wreorder-ctor] 8 670 | ] tid/(tid)N, nthCreadsC(ntL_STEPhSread/s),sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ ti dInBlock(threadIdx.x), gr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepoup(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:1062:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested hereste pSi ze(step1062Si | ze_ = = 0 ? ncc Size_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_2, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ runRing]/NCCL_STEP(S/sizteof(Ti) :d step,Size_ ) { n| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group t/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254h:90: note: rin instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here eads254 | Primitives, 1, 1, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:10:1: note: in instantiation of member function 'RunWorkBatch, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllRedc, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:uce_RING_LL128_Sum_f32_2, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_LL128, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 432:78: note: 611in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here | 432 | i f (t id < subRtn) unWorkBatch()y.ru>n(t,id, subatn,l wogrk)o; ,| ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp :7:p1: rnote: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here o 7t | DEoFIN/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~, unrollE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_2, >().run(); \ | ^ ncclFuncAllReduce, FuncSum , | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_2, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_4, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(ti =d= ,0 s? uncbcltShnme,m.comm .buwffoSirzeks[)NC;CL _P R| OT ^O_ SI/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cppMPLE:]/12NC:CL1_S:TEP Snote: /in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested heresi z eof(12T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | | group(groupDE FI/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hNE_nc:c254lDe:vF90u: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives,nc(AllReduce_RING_SIMPLE_Sum_f32_2, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78:y >note: , in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested hereal g o, p432ro | to , un rol l> () .riunf() ; (\ t | i ^ d/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h :670<:15: note: field 'nthreads' will be initialized after field 'tidInBlock' s 670 | tid(tid), nthreads(nthreads), tidInBlock(threaubdtnI) dRuxnW.orxkC)ol,l< Fng, Tr,o RuedpOp(, gAlroup), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads),go, Proto, COLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_4, ncclFuncAllReduce, FuncSu tmid,In Block(threadIdx.x), group(group), | ^~~~~~~~~~~ float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_4, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_2, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_4, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_4, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_4, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f32_2, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthr/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_4, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | , RedOp, FanSymmetric<1>, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | run:R670:15:i warning: initializer order does not match the declaration order [-Wreorder-ctor] n 670 | g , algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ stepLSize(_stepSUize_ N=ROL= 0 ? nccL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RluShmenm.coWmm.bouffSrizesk[NCCCL_PROoTO_SlIMPLlE]/N().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here63 :56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | 12 P | rimiDtivesE, c0, Pcroto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested herelDevFunc(AllReduce_RING_SIMPLE_Sum_f32_2, ncclFuncAllRedu 558c | reunRin,g(tmid, ,nthr eadsf, wolrk); o | ^ a/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.ht, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: :432:expanded from macro 'DEFINE_ncclDevFunc'78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 611 | RunWorkBatch < c432 | o l l ,i f t(tyid, < srubetnd) oRupnWl<,F na, Tl, RedOp, Algo, Proto, COLL_UNROLL>().run(tid, subtn,go, proto, unroll>().run() w;or k)\; | ^ | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp ^: 22:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h1: note: :in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 670 :22 | 15DEFIN:E_n ccnote: lDfield 'nthreads' will be initialized after field 'tidInBlock'ev F670un | c( A tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads)l,lReduce_RING_SIMPLE_Sum_f32_4, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkB tidIn17Block(threadI warningds generated when compiling for host. x.x), group(group), | ^~~~~~~~~~~ atch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_4, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f32_2, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(groupfield 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(gro)u, | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ p), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670: ^15 /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h::432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here warning: 432 | initializer order does not match the declaration order [-Wreorder-ctor] if (t id < subtn670) Ru | nWor kColl()).run,(tid , sunbtn,t workh);reads(nthreads), tidInBl | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMock(threadIdx.x/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_4, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' ), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.hPLE_Sum_f3:2_4,303 ncc:lFu90ncAl:lRed uce, note: Funin instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested herecSum, f lo 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ at,303 NCCL | _ALGO _TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_4, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_4, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_4, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h4, nccl:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims FuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | Ru | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f32_4, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(thread/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize17_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Pr/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.hi:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_4, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | mitives, 0, warning s generated when compiling for Pgfx1200. roto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f32_4, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f32_4, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_4, ncclFuncAllRedu/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f32_4, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_4, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_4, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f32_4, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_4, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:303:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 303 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:17:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 4>::run' requested here 17 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32_4, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 63 | Pri m670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing, 0, ProtoUNROLL,>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl prOLL_UNROLL>().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f32_4, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch,ims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f32_4, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEF/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:63:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 63 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 1, 2, 4>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:22:1: note: in instantiation of member function 'RunWorkBatch, 1, 2, 4>::run' requested here 22 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f32_4, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE, 4) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1100. [ 66%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60402 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx906 --offload-arch=gfx908 --offload-arch=gfx90a --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f64.cpp.o -c /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: In file included from unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:12: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/collectives.h:15: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/device.h:14: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/include/rccl_float8.h:77:18: warning: unused variable 'y' [-Wunused-variable] 77 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group();In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ :15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ _group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1,In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp::2: In file included from 2/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: : /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5:In file included from warning: unused variable 'w' [-Wunused-variable] /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h80 | : 11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx 29 | . consxt in/t w =W threadAIdx.x/WARRP_SIZEP; \ | ^_ SIZE; \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - worIn file included from k->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from 80/builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174:: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: 5warning: unused variable 'w' [-Wunused-variable] 75 | : b awarning: runused variable 'w' [-Wunused-variable]r i 80 | er_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/W barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ ARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.chIn file included from annelId - /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cppwork->channelLo; | ^~~ :2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:75:7: warning: unused variable 'w' [-Wunused-variable] 75 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:174: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:14: warning: unused variable 'data1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:21: warning: unused variable 'flag1' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:28: warning: unused variable 'data2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll.h:145:35: warning: unused variable 'flag2' [-Wunused-variable] 145 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:175: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_ll128.h:80:5: warning: unused variable 'w' [-Wunused-variable] 80 | barrier_by_group(); | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:29:15: note: expanded from macro 'barrier_by_group' 29 | const int w = threadIdx.x/WARP_SIZE; \ | ^ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:27:15: warning: unused variable 'bid' [-Wunused-variable] 27 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:218:15: warning: unused variable 'bid' [-Wunused-variable] 218 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:366:15: warning: unused variable 'bid' [-Wunused-variable] 366 | const int bid = ncclShmem.channelId - work->channelLo; | ^~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | if (tid < subtn) RunWorkColl().run(tid, subtn, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWorkBatch, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64_2, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE, 2) | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:611:62: note: expanded from macro 'DEFINE_ncclDevFunc' 611 | RunWorkBatch, algo, proto, unroll>().run(); \ | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:60: note: field 'group' will be initialized after field 'stepSize' 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 671 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:254:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 254 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(tid, nthreads, work); | ^ /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/common.h:432:78: note: in instantiation of member function 'RunWorkColl, 0, 2, 2>::run' requested here 432 | In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/all_reduce.h:11: In file included from /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/primitives.h:173: /builddir/build/BUILD/rccl-6.4.2-build/rccl-rocm-6.4.2/redhat-linux-build/hipify/src/device/prims_simple.h:670:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 670 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(gro iuf (tid